From 7fb2c1c48dee7dfb723fc12af176cc1e898957b9 Mon Sep 17 00:00:00 2001
From: Dinesh Yeduguru <yvdinesh@gmail.com>
Date: Wed, 15 Jan 2025 13:20:09 -0800
Subject: [PATCH] More idiomatic REST API (#765)

# What does this PR do?

This PR changes our API to follow more idiomatic REST API approaches of
having paths being resources and methods indicating the action being
performed.

Changes made to generator:
1) removed the prefix check of "get" as its not required and is actually
needed for other method types too
2) removed _ check on path since variables can have "_"


## Test Plan

LLAMA_STACK_BASE_URL=http://localhost:5000 pytest -v
tests/client-sdk/agents/test_agents.py
---
 .../openapi_generator/pyopenapi/operations.py |   58 +-
 docs/resources/llama-stack-spec.html          | 2173 +++++++++--------
 docs/resources/llama-stack-spec.yaml          | 1436 +++++------
 llama_stack/apis/agents/agents.py             |   44 +-
 .../apis/batch_inference/batch_inference.py   |    4 +-
 llama_stack/apis/datasetio/datasetio.py       |    4 +-
 llama_stack/apis/datasets/datasets.py         |   16 +-
 llama_stack/apis/eval/eval.py                 |   16 +-
 llama_stack/apis/eval_tasks/eval_tasks.py     |   18 +-
 llama_stack/apis/inference/inference.py       |    6 +-
 llama_stack/apis/inspect/inspect.py           |    6 +-
 llama_stack/apis/memory/memory.py             |    4 +-
 llama_stack/apis/memory_banks/memory_banks.py |   20 +-
 llama_stack/apis/models/models.py             |   24 +-
 .../apis/post_training/post_training.py       |    9 +-
 llama_stack/apis/safety/safety.py             |    3 +-
 llama_stack/apis/scoring/scoring.py           |    5 +-
 .../scoring_functions/scoring_functions.py    |   17 +-
 llama_stack/apis/shields/shields.py           |   12 +-
 llama_stack/apis/telemetry/telemetry.py       |    4 +-
 llama_stack/apis/tools/tools.py               |   36 +-
 .../distribution/routers/routing_tables.py    |   77 +-
 llama_stack/distribution/server/server.py     |   40 +-
 llama_stack/distribution/stack.py             |    6 +-
 .../agents/meta_reference/agent_instance.py   |    8 +-
 .../inline/agents/meta_reference/agents.py    |    2 +-
 .../post_training/torchtune/post_training.py  |    7 +-
 .../telemetry/meta_reference/telemetry.py     |    2 +-
 tests/client-sdk/agents/test_agents.py        |    4 +-
 29 files changed, 2144 insertions(+), 1917 deletions(-)

diff --git a/docs/openapi_generator/pyopenapi/operations.py b/docs/openapi_generator/pyopenapi/operations.py
index cc3a06b7b..4cea9d970 100644
--- a/docs/openapi_generator/pyopenapi/operations.py
+++ b/docs/openapi_generator/pyopenapi/operations.py
@@ -8,7 +8,6 @@ import collections.abc
 import enum
 import inspect
 import typing
-import uuid
 from dataclasses import dataclass
 from typing import Any, Callable, Dict, Iterable, Iterator, List, Optional, Tuple, Union
 
@@ -16,12 +15,7 @@ from llama_stack.apis.version import LLAMA_STACK_API_VERSION
 
 from termcolor import colored
 
-from ..strong_typing.inspection import (
-    get_signature,
-    is_type_enum,
-    is_type_optional,
-    unwrap_optional_type,
-)
+from ..strong_typing.inspection import get_signature
 
 
 def split_prefix(
@@ -113,9 +107,6 @@ class EndpointOperation:
 
     def get_route(self) -> str:
         if self.route is not None:
-            assert (
-                "_" not in self.route
-            ), f"route should not contain underscores: {self.route}"
             return "/".join(["", LLAMA_STACK_API_VERSION, self.route.lstrip("/")])
 
         route_parts = ["", LLAMA_STACK_API_VERSION, self.name]
@@ -265,42 +256,16 @@ def get_endpoint_operations(
                     f"parameter '{param_name}' in function '{func_name}' has no type annotation"
                 )
 
-            if is_type_optional(param_type):
-                inner_type: type = unwrap_optional_type(param_type)
-            else:
-                inner_type = param_type
-
-            if prefix == "get" and (
-                inner_type is bool
-                or inner_type is int
-                or inner_type is float
-                or inner_type is str
-                or inner_type is uuid.UUID
-                or is_type_enum(inner_type)
-            ):
-                if parameter.kind == inspect.Parameter.POSITIONAL_ONLY:
-                    if route_params is not None and param_name not in route_params:
-                        raise ValidationError(
-                            f"positional parameter '{param_name}' absent from user-defined route '{route}' for function '{func_name}'"
-                        )
-
-                    # simple type maps to route path element, e.g. /study/{uuid}/{version}
+            if prefix in ["get", "delete"]:
+                if route_params is not None and param_name in route_params:
                     path_params.append((param_name, param_type))
                 else:
-                    if route_params is not None and param_name in route_params:
-                        raise ValidationError(
-                            f"query parameter '{param_name}' found in user-defined route '{route}' for function '{func_name}'"
-                        )
-
-                    # simple type maps to key=value pair in query string
                     query_params.append((param_name, param_type))
             else:
                 if route_params is not None and param_name in route_params:
-                    raise ValidationError(
-                        f"user-defined route '{route}' for function '{func_name}' has parameter '{param_name}' of composite type: {param_type}"
-                    )
-
-                request_params.append((param_name, param_type))
+                    path_params.append((param_name, param_type))
+                else:
+                    request_params.append((param_name, param_type))
 
         # check if function has explicit return type
         if signature.return_annotation is inspect.Signature.empty:
@@ -335,19 +300,18 @@ def get_endpoint_operations(
 
             response_type = process_type(return_type)
 
-        # set HTTP request method based on type of request and presence of payload
-        if not request_params:
             if prefix in ["delete", "remove"]:
                 http_method = HTTPMethod.DELETE
-            else:
+            elif prefix == "post":
+                http_method = HTTPMethod.POST
+            elif prefix == "get":
                 http_method = HTTPMethod.GET
-        else:
-            if prefix == "set":
+            elif prefix == "set":
                 http_method = HTTPMethod.PUT
             elif prefix == "update":
                 http_method = HTTPMethod.PATCH
             else:
-                http_method = HTTPMethod.POST
+                raise ValidationError(f"unknown prefix {prefix}")
 
         result.append(
             EndpointOperation(
diff --git a/docs/resources/llama-stack-spec.html b/docs/resources/llama-stack-spec.html
index 3f74a79cf..2db33c87a 100644
--- a/docs/resources/llama-stack-spec.html
+++ b/docs/resources/llama-stack-spec.html
@@ -29,7 +29,76 @@
         }
     ],
     "paths": {
-        "/v1/datasetio/append-rows": {
+        "/v1/datasetio/rows": {
+            "get": {
+                "responses": {
+                    "200": {
+                        "description": "OK",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/PaginatedRowsResult"
+                                }
+                            }
+                        }
+                    }
+                },
+                "tags": [
+                    "DatasetIO"
+                ],
+                "parameters": [
+                    {
+                        "name": "dataset_id",
+                        "in": "query",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "rows_in_page",
+                        "in": "query",
+                        "required": true,
+                        "schema": {
+                            "type": "integer"
+                        }
+                    },
+                    {
+                        "name": "page_token",
+                        "in": "query",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "filter_condition",
+                        "in": "query",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
             "post": {
                 "responses": {
                     "200": {
@@ -323,7 +392,7 @@
                 }
             }
         },
-        "/v1/agents/create": {
+        "/v1/agents": {
             "post": {
                 "responses": {
                     "200": {
@@ -372,7 +441,7 @@
                 }
             }
         },
-        "/v1/agents/session/create": {
+        "/v1/agents/{agent_id}/session": {
             "post": {
                 "responses": {
                     "200": {
@@ -390,6 +459,14 @@
                     "Agents"
                 ],
                 "parameters": [
+                    {
+                        "name": "agent_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -421,7 +498,7 @@
                 }
             }
         },
-        "/v1/agents/turn/create": {
+        "/v1/agents/{agent_id}/session/{session_id}/turn": {
             "post": {
                 "responses": {
                     "200": {
@@ -446,6 +523,22 @@
                     "Agents"
                 ],
                 "parameters": [
+                    {
+                        "name": "agent_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "session_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -477,8 +570,8 @@
                 }
             }
         },
-        "/v1/agents/delete": {
-            "post": {
+        "/v1/agents/{agent_id}": {
+            "delete": {
                 "responses": {
                     "200": {
                         "description": "OK"
@@ -488,6 +581,14 @@
                     "Agents"
                 ],
                 "parameters": [
+                    {
+                        "name": "agent_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -506,30 +607,54 @@
                             "type": "string"
                         }
                     }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/DeleteAgentsRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
+                ]
             }
         },
-        "/v1/agents/session/delete": {
-            "post": {
+        "/v1/agents/{agent_id}/session/{session_id}": {
+            "get": {
                 "responses": {
                     "200": {
-                        "description": "OK"
+                        "description": "OK",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/Session"
+                                }
+                            }
+                        }
                     }
                 },
                 "tags": [
                     "Agents"
                 ],
                 "parameters": [
+                    {
+                        "name": "session_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "agent_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "turn_ids",
+                        "in": "query",
+                        "required": false,
+                        "schema": {
+                            "type": "array",
+                            "items": {
+                                "type": "string"
+                            }
+                        }
+                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -548,17 +673,53 @@
                             "type": "string"
                         }
                     }
+                ]
+            },
+            "delete": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "Agents"
                 ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/DeleteAgentsSessionRequest"
-                            }
+                "parameters": [
+                    {
+                        "name": "session_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
                         }
                     },
-                    "required": true
-                }
+                    {
+                        "name": "agent_id",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
             }
         },
         "/v1/inference/embeddings": {
@@ -659,72 +820,7 @@
                 }
             }
         },
-        "/v1/agents/session/get": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "$ref": "#/components/schemas/Session"
-                                }
-                            }
-                        }
-                    }
-                },
-                "tags": [
-                    "Agents"
-                ],
-                "parameters": [
-                    {
-                        "name": "agent_id",
-                        "in": "query",
-                        "required": true,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "session_id",
-                        "in": "query",
-                        "required": true,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/GetAgentsSessionRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/agents/step/get": {
+        "/v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/step/{step_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -744,7 +840,7 @@
                 "parameters": [
                     {
                         "name": "agent_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -752,7 +848,7 @@
                     },
                     {
                         "name": "session_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -760,7 +856,7 @@
                     },
                     {
                         "name": "turn_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -768,7 +864,7 @@
                     },
                     {
                         "name": "step_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -795,7 +891,7 @@
                 ]
             }
         },
-        "/v1/agents/turn/get": {
+        "/v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -815,7 +911,7 @@
                 "parameters": [
                     {
                         "name": "agent_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -823,7 +919,7 @@
                     },
                     {
                         "name": "session_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -831,7 +927,7 @@
                     },
                     {
                         "name": "turn_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -858,7 +954,7 @@
                 ]
             }
         },
-        "/v1/datasets/get": {
+        "/v1/datasets/{dataset_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -885,7 +981,45 @@
                 "parameters": [
                     {
                         "name": "dataset_id",
-                        "in": "query",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
+            "delete": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "Datasets"
+                ],
+                "parameters": [
+                    {
+                        "name": "dataset_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -912,7 +1046,7 @@
                 ]
             }
         },
-        "/v1/eval-tasks/get": {
+        "/v1/eval-tasks/{eval_task_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -938,8 +1072,8 @@
                 ],
                 "parameters": [
                     {
-                        "name": "name",
-                        "in": "query",
+                        "name": "eval_task_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -966,7 +1100,7 @@
                 ]
             }
         },
-        "/v1/memory-banks/get": {
+        "/v1/memory-banks/{memory_bank_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -993,7 +1127,45 @@
                 "parameters": [
                     {
                         "name": "memory_bank_id",
-                        "in": "query",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
+            "delete": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "MemoryBanks"
+                ],
+                "parameters": [
+                    {
+                        "name": "memory_bank_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1020,7 +1192,7 @@
                 ]
             }
         },
-        "/v1/models/get": {
+        "/v1/models/{model_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1046,8 +1218,8 @@
                 ],
                 "parameters": [
                     {
-                        "name": "identifier",
-                        "in": "query",
+                        "name": "model_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1072,58 +1244,25 @@
                         }
                     }
                 ]
-            }
-        },
-        "/v1/datasetio/get-rows-paginated": {
-            "get": {
+            },
+            "delete": {
                 "responses": {
                     "200": {
-                        "description": "OK",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "$ref": "#/components/schemas/PaginatedRowsResult"
-                                }
-                            }
-                        }
+                        "description": "OK"
                     }
                 },
                 "tags": [
-                    "DatasetIO"
+                    "Models"
                 ],
                 "parameters": [
                     {
-                        "name": "dataset_id",
-                        "in": "query",
+                        "name": "model_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
                         }
                     },
-                    {
-                        "name": "rows_in_page",
-                        "in": "query",
-                        "required": true,
-                        "schema": {
-                            "type": "integer"
-                        }
-                    },
-                    {
-                        "name": "page_token",
-                        "in": "query",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "filter_condition",
-                        "in": "query",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -1145,7 +1284,7 @@
                 ]
             }
         },
-        "/v1/scoring-functions/get": {
+        "/v1/scoring-functions/{scoring_fn_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1172,7 +1311,7 @@
                 "parameters": [
                     {
                         "name": "scoring_fn_id",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1199,7 +1338,7 @@
                 ]
             }
         },
-        "/v1/shields/get": {
+        "/v1/shields/{identifier}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1226,7 +1365,7 @@
                 "parameters": [
                     {
                         "name": "identifier",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1253,75 +1392,7 @@
                 ]
             }
         },
-        "/v1/telemetry/get-span-tree": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "type": "object",
-                                    "additionalProperties": {
-                                        "$ref": "#/components/schemas/SpanWithStatus"
-                                    }
-                                }
-                            }
-                        }
-                    }
-                },
-                "tags": [
-                    "Telemetry"
-                ],
-                "parameters": [
-                    {
-                        "name": "span_id",
-                        "in": "query",
-                        "required": true,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "max_depth",
-                        "in": "query",
-                        "required": false,
-                        "schema": {
-                            "type": "integer"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/GetSpanTreeRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/tools/get": {
+        "/v1/tools/{tool_name}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1341,7 +1412,7 @@
                 "parameters": [
                     {
                         "name": "tool_name",
-                        "in": "query",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1368,7 +1439,7 @@
                 ]
             }
         },
-        "/v1/toolgroups/get": {
+        "/v1/toolgroups/{toolgroup_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1388,7 +1459,46 @@
                 "parameters": [
                     {
                         "name": "toolgroup_id",
-                        "in": "query",
+                        "in": "path",
+                        "required": true,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
+            "delete": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "ToolGroups"
+                ],
+                "summary": "Unregister a tool group",
+                "parameters": [
+                    {
+                        "name": "toolgroup_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
@@ -1529,9 +1639,9 @@
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/PostTrainingJob"
+                                    "$ref": "#/components/schemas/ListPostTrainingJobsResponse"
                                 }
                             }
                         }
@@ -1693,7 +1803,7 @@
                 }
             }
         },
-        "/v1/eval/job/cancel": {
+        "/v1/eval/jobs/cancel": {
             "post": {
                 "responses": {
                     "200": {
@@ -1735,7 +1845,7 @@
                 }
             }
         },
-        "/v1/eval/job/result": {
+        "/v1/eval/jobs/{job_id}/result": {
             "get": {
                 "responses": {
                     "200": {
@@ -1754,15 +1864,15 @@
                 ],
                 "parameters": [
                     {
-                        "name": "task_id",
-                        "in": "query",
+                        "name": "job_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
                         }
                     },
                     {
-                        "name": "job_id",
+                        "name": "task_id",
                         "in": "query",
                         "required": true,
                         "schema": {
@@ -1790,7 +1900,7 @@
                 ]
             }
         },
-        "/v1/eval/job/status": {
+        "/v1/eval/jobs/{job_id}": {
             "get": {
                 "responses": {
                     "200": {
@@ -1816,15 +1926,15 @@
                 ],
                 "parameters": [
                     {
-                        "name": "task_id",
-                        "in": "query",
+                        "name": "job_id",
+                        "in": "path",
                         "required": true,
                         "schema": {
                             "type": "string"
                         }
                     },
                     {
-                        "name": "job_id",
+                        "name": "task_id",
                         "in": "query",
                         "required": true,
                         "schema": {
@@ -1852,15 +1962,15 @@
                 ]
             }
         },
-        "/v1/datasets/list": {
+        "/v1/datasets": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/Dataset"
+                                    "$ref": "#/components/schemas/ListDatasetsResponse"
                                 }
                             }
                         }
@@ -1889,17 +1999,57 @@
                         }
                     }
                 ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "Datasets"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterDatasetRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/eval-tasks/list": {
+        "/v1/eval-tasks": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/EvalTask"
+                                    "$ref": "#/components/schemas/ListEvalTasksResponse"
                                 }
                             }
                         }
@@ -1928,17 +2078,57 @@
                         }
                     }
                 ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "EvalTasks"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterEvalTaskRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/memory-banks/list": {
+        "/v1/memory-banks": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/MemoryBank"
+                                    "$ref": "#/components/schemas/ListMemoryBanksResponse"
                                 }
                             }
                         }
@@ -1967,15 +2157,112 @@
                         }
                     }
                 ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "oneOf": [
+                                        {
+                                            "$ref": "#/components/schemas/VectorMemoryBank"
+                                        },
+                                        {
+                                            "$ref": "#/components/schemas/KeyValueMemoryBank"
+                                        },
+                                        {
+                                            "$ref": "#/components/schemas/KeywordMemoryBank"
+                                        },
+                                        {
+                                            "$ref": "#/components/schemas/GraphMemoryBank"
+                                        }
+                                    ]
+                                }
+                            }
+                        }
+                    }
+                },
+                "tags": [
+                    "MemoryBanks"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterMemoryBankRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/models/list": {
+        "/v1/models": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/ListModelsResponse"
+                                }
+                            }
+                        }
+                    }
+                },
+                "tags": [
+                    "Models"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK",
+                        "content": {
+                            "application/json": {
                                 "schema": {
                                     "$ref": "#/components/schemas/Model"
                                 }
@@ -2005,7 +2292,17 @@
                             "type": "string"
                         }
                     }
-                ]
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterModelRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
         "/v1/providers/list": {
@@ -2016,10 +2313,7 @@
                         "content": {
                             "application/json": {
                                 "schema": {
-                                    "type": "object",
-                                    "additionalProperties": {
-                                        "$ref": "#/components/schemas/ProviderInfo"
-                                    }
+                                    "$ref": "#/components/schemas/ListProvidersResponse"
                                 }
                             }
                         }
@@ -2096,7 +2390,7 @@
             }
         },
         "/v1/tool-runtime/list-tools": {
-            "post": {
+            "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
@@ -2121,6 +2415,14 @@
                             "type": "string"
                         }
                     },
+                    {
+                        "name": "mcp_endpoint",
+                        "in": "query",
+                        "required": false,
+                        "schema": {
+                            "$ref": "#/components/schemas/URL"
+                        }
+                    },
                     {
                         "name": "X-LlamaStack-Provider-Data",
                         "in": "header",
@@ -2139,28 +2441,18 @@
                             "type": "string"
                         }
                     }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/ListRuntimeToolsRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
+                ]
             }
         },
-        "/v1/scoring-functions/list": {
+        "/v1/scoring-functions": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/ScoringFn"
+                                    "$ref": "#/components/schemas/ListScoringFunctionsResponse"
                                 }
                             }
                         }
@@ -2189,15 +2481,92 @@
                         }
                     }
                 ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "ScoringFunctions"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterScoringFunctionRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/shields/list": {
+        "/v1/shields": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
+                                "schema": {
+                                    "$ref": "#/components/schemas/ListShieldsResponse"
+                                }
+                            }
+                        }
+                    }
+                },
+                "tags": [
+                    "Shields"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK",
+                        "content": {
+                            "application/json": {
                                 "schema": {
                                     "$ref": "#/components/schemas/Shield"
                                 }
@@ -2227,18 +2596,28 @@
                             "type": "string"
                         }
                     }
-                ]
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterShieldRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/toolgroups/list": {
+        "/v1/toolgroups": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/ToolGroup"
+                                    "$ref": "#/components/schemas/ListToolGroupsResponse"
                                 }
                             }
                         }
@@ -2268,17 +2647,58 @@
                         }
                     }
                 ]
+            },
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK"
+                    }
+                },
+                "tags": [
+                    "ToolGroups"
+                ],
+                "summary": "Register a tool group",
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/RegisterToolGroupRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
             }
         },
-        "/v1/tools/list": {
+        "/v1/tools": {
             "get": {
                 "responses": {
                     "200": {
                         "description": "OK",
                         "content": {
-                            "application/jsonl": {
+                            "application/json": {
                                 "schema": {
-                                    "$ref": "#/components/schemas/Tool"
+                                    "$ref": "#/components/schemas/ListToolsResponse"
                                 }
                             }
                         }
@@ -2290,7 +2710,7 @@
                 "summary": "List tools with optional tool group",
                 "parameters": [
                     {
-                        "name": "tool_group_id",
+                        "name": "toolgroup_id",
                         "in": "query",
                         "required": false,
                         "schema": {
@@ -2458,6 +2878,58 @@
                 }
             }
         },
+        "/v1/telemetry/query-span-tree": {
+            "post": {
+                "responses": {
+                    "200": {
+                        "description": "OK",
+                        "content": {
+                            "application/json": {
+                                "schema": {
+                                    "type": "object",
+                                    "additionalProperties": {
+                                        "$ref": "#/components/schemas/SpanWithStatus"
+                                    }
+                                }
+                            }
+                        }
+                    }
+                },
+                "tags": [
+                    "Telemetry"
+                ],
+                "parameters": [
+                    {
+                        "name": "X-LlamaStack-Provider-Data",
+                        "in": "header",
+                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    },
+                    {
+                        "name": "X-LlamaStack-Client-Version",
+                        "in": "header",
+                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
+                        "required": false,
+                        "schema": {
+                            "type": "string"
+                        }
+                    }
+                ],
+                "requestBody": {
+                    "content": {
+                        "application/json": {
+                            "schema": {
+                                "$ref": "#/components/schemas/QuerySpanTreeRequest"
+                            }
+                        }
+                    },
+                    "required": true
+                }
+            }
+        },
         "/v1/telemetry/query-spans": {
             "post": {
                 "responses": {
@@ -2556,336 +3028,7 @@
                 }
             }
         },
-        "/v1/datasets/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "Datasets"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterDatasetRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/eval-tasks/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "EvalTasks"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterEvalTaskRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/memory-banks/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "oneOf": [
-                                        {
-                                            "$ref": "#/components/schemas/VectorMemoryBank"
-                                        },
-                                        {
-                                            "$ref": "#/components/schemas/KeyValueMemoryBank"
-                                        },
-                                        {
-                                            "$ref": "#/components/schemas/KeywordMemoryBank"
-                                        },
-                                        {
-                                            "$ref": "#/components/schemas/GraphMemoryBank"
-                                        }
-                                    ]
-                                }
-                            }
-                        }
-                    }
-                },
-                "tags": [
-                    "MemoryBanks"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterMemoryBankRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/models/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "$ref": "#/components/schemas/Model"
-                                }
-                            }
-                        }
-                    }
-                },
-                "tags": [
-                    "Models"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterModelRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/scoring-functions/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "ScoringFunctions"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterScoringFunctionRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/shields/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK",
-                        "content": {
-                            "application/json": {
-                                "schema": {
-                                    "$ref": "#/components/schemas/Shield"
-                                }
-                            }
-                        }
-                    }
-                },
-                "tags": [
-                    "Shields"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterShieldRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/toolgroups/register": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "ToolGroups"
-                ],
-                "summary": "Register a tool group",
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/RegisterToolGroupRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/eval/run-eval": {
+        "/v1/eval/run": {
             "post": {
                 "responses": {
                     "200": {
@@ -3221,175 +3364,6 @@
                 }
             }
         },
-        "/v1/datasets/unregister": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "Datasets"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/UnregisterDatasetRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/memory-banks/unregister": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "MemoryBanks"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/UnregisterMemoryBankRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/models/unregister": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "Models"
-                ],
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/UnregisterModelRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
-        "/v1/toolgroups/unregister": {
-            "post": {
-                "responses": {
-                    "200": {
-                        "description": "OK"
-                    }
-                },
-                "tags": [
-                    "ToolGroups"
-                ],
-                "summary": "Unregister a tool group",
-                "parameters": [
-                    {
-                        "name": "X-LlamaStack-Provider-Data",
-                        "in": "header",
-                        "description": "JSON-encoded provider data which will be made available to the adapter servicing the API",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    },
-                    {
-                        "name": "X-LlamaStack-Client-Version",
-                        "in": "header",
-                        "description": "Version of the client making the request. This is used to ensure that the client and server are compatible.",
-                        "required": false,
-                        "schema": {
-                            "type": "string"
-                        }
-                    }
-                ],
-                "requestBody": {
-                    "content": {
-                        "application/json": {
-                            "schema": {
-                                "$ref": "#/components/schemas/UnregisterToolGroupRequest"
-                            }
-                        }
-                    },
-                    "required": true
-                }
-            }
-        },
         "/v1/version": {
             "get": {
                 "responses": {
@@ -3512,6 +3486,20 @@
                     "tool_calls"
                 ]
             },
+            "GreedySamplingStrategy": {
+                "type": "object",
+                "properties": {
+                    "type": {
+                        "type": "string",
+                        "const": "greedy",
+                        "default": "greedy"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "type"
+                ]
+            },
             "ImageContentItem": {
                 "type": "object",
                 "properties": {
@@ -3579,20 +3567,17 @@
                 "type": "object",
                 "properties": {
                     "strategy": {
-                        "$ref": "#/components/schemas/SamplingStrategy",
-                        "default": "greedy"
-                    },
-                    "temperature": {
-                        "type": "number",
-                        "default": 0.0
-                    },
-                    "top_p": {
-                        "type": "number",
-                        "default": 0.95
-                    },
-                    "top_k": {
-                        "type": "integer",
-                        "default": 0
+                        "oneOf": [
+                            {
+                                "$ref": "#/components/schemas/GreedySamplingStrategy"
+                            },
+                            {
+                                "$ref": "#/components/schemas/TopPSamplingStrategy"
+                            },
+                            {
+                                "$ref": "#/components/schemas/TopKSamplingStrategy"
+                            }
+                        ]
                     },
                     "max_tokens": {
                         "type": "integer",
@@ -3608,14 +3593,6 @@
                     "strategy"
                 ]
             },
-            "SamplingStrategy": {
-                "type": "string",
-                "enum": [
-                    "greedy",
-                    "top_p",
-                    "top_k"
-                ]
-            },
             "StopReason": {
                 "type": "string",
                 "enum": [
@@ -3869,6 +3846,45 @@
                     "content"
                 ]
             },
+            "TopKSamplingStrategy": {
+                "type": "object",
+                "properties": {
+                    "type": {
+                        "type": "string",
+                        "const": "top_k",
+                        "default": "top_k"
+                    },
+                    "top_k": {
+                        "type": "integer"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "type",
+                    "top_k"
+                ]
+            },
+            "TopPSamplingStrategy": {
+                "type": "object",
+                "properties": {
+                    "type": {
+                        "type": "string",
+                        "const": "top_p",
+                        "default": "top_p"
+                    },
+                    "temperature": {
+                        "type": "number"
+                    },
+                    "top_p": {
+                        "type": "number",
+                        "default": 0.95
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "type"
+                ]
+            },
             "URL": {
                 "type": "object",
                 "properties": {
@@ -4631,16 +4647,12 @@
             "CreateAgentSessionRequest": {
                 "type": "object",
                 "properties": {
-                    "agent_id": {
-                        "type": "string"
-                    },
                     "session_name": {
                         "type": "string"
                     }
                 },
                 "additionalProperties": false,
                 "required": [
-                    "agent_id",
                     "session_name"
                 ]
             },
@@ -4659,12 +4671,6 @@
             "CreateAgentTurnRequest": {
                 "type": "object",
                 "properties": {
-                    "agent_id": {
-                        "type": "string"
-                    },
-                    "session_id": {
-                        "type": "string"
-                    },
                     "messages": {
                         "type": "array",
                         "items": {
@@ -4725,8 +4731,6 @@
                 },
                 "additionalProperties": false,
                 "required": [
-                    "agent_id",
-                    "session_id",
                     "messages"
                 ]
             },
@@ -5266,34 +5270,6 @@
                     "error"
                 ]
             },
-            "DeleteAgentsRequest": {
-                "type": "object",
-                "properties": {
-                    "agent_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "agent_id"
-                ]
-            },
-            "DeleteAgentsSessionRequest": {
-                "type": "object",
-                "properties": {
-                    "agent_id": {
-                        "type": "string"
-                    },
-                    "session_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "agent_id",
-                    "session_id"
-                ]
-            },
             "EmbeddingsRequest": {
                 "type": "object",
                 "properties": {
@@ -5701,18 +5677,6 @@
                     "aggregated_results"
                 ]
             },
-            "GetAgentsSessionRequest": {
-                "type": "object",
-                "properties": {
-                    "turn_ids": {
-                        "type": "array",
-                        "items": {
-                            "type": "string"
-                        }
-                    }
-                },
-                "additionalProperties": false
-            },
             "GraphMemoryBank": {
                 "type": "object",
                 "properties": {
@@ -6431,85 +6395,6 @@
                 ],
                 "title": "A safety shield resource that can be used to check content"
             },
-            "GetSpanTreeRequest": {
-                "type": "object",
-                "properties": {
-                    "attributes_to_return": {
-                        "type": "array",
-                        "items": {
-                            "type": "string"
-                        }
-                    }
-                },
-                "additionalProperties": false
-            },
-            "SpanStatus": {
-                "type": "string",
-                "enum": [
-                    "ok",
-                    "error"
-                ]
-            },
-            "SpanWithStatus": {
-                "type": "object",
-                "properties": {
-                    "span_id": {
-                        "type": "string"
-                    },
-                    "trace_id": {
-                        "type": "string"
-                    },
-                    "parent_span_id": {
-                        "type": "string"
-                    },
-                    "name": {
-                        "type": "string"
-                    },
-                    "start_time": {
-                        "type": "string",
-                        "format": "date-time"
-                    },
-                    "end_time": {
-                        "type": "string",
-                        "format": "date-time"
-                    },
-                    "attributes": {
-                        "type": "object",
-                        "additionalProperties": {
-                            "oneOf": [
-                                {
-                                    "type": "null"
-                                },
-                                {
-                                    "type": "boolean"
-                                },
-                                {
-                                    "type": "number"
-                                },
-                                {
-                                    "type": "string"
-                                },
-                                {
-                                    "type": "array"
-                                },
-                                {
-                                    "type": "object"
-                                }
-                            ]
-                        }
-                    },
-                    "status": {
-                        "$ref": "#/components/schemas/SpanStatus"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "span_id",
-                    "trace_id",
-                    "name",
-                    "start_time"
-                ]
-            },
             "Tool": {
                 "type": "object",
                 "properties": {
@@ -6735,16 +6620,28 @@
                 ],
                 "title": "Status of a finetuning job."
             },
-            "PostTrainingJob": {
+            "ListPostTrainingJobsResponse": {
                 "type": "object",
                 "properties": {
-                    "job_uuid": {
-                        "type": "string"
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "type": "object",
+                            "properties": {
+                                "job_uuid": {
+                                    "type": "string"
+                                }
+                            },
+                            "additionalProperties": false,
+                            "required": [
+                                "job_uuid"
+                            ]
+                        }
                     }
                 },
                 "additionalProperties": false,
                 "required": [
-                    "job_uuid"
+                    "data"
                 ]
             },
             "HealthInfo": {
@@ -6901,17 +6798,77 @@
             "JobCancelRequest": {
                 "type": "object",
                 "properties": {
-                    "task_id": {
+                    "job_id": {
                         "type": "string"
                     },
-                    "job_id": {
+                    "task_id": {
                         "type": "string"
                     }
                 },
                 "additionalProperties": false,
                 "required": [
-                    "task_id",
-                    "job_id"
+                    "job_id",
+                    "task_id"
+                ]
+            },
+            "ListDatasetsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/Dataset"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListEvalTasksResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/EvalTask"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListMemoryBanksResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/MemoryBank"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListModelsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/Model"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
                 ]
             },
             "ProviderInfo": {
@@ -6930,6 +6887,21 @@
                     "provider_type"
                 ]
             },
+            "ListProvidersResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/ProviderInfo"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
             "RouteInfo": {
                 "type": "object",
                 "properties": {
@@ -6953,14 +6925,65 @@
                     "provider_types"
                 ]
             },
-            "ListRuntimeToolsRequest": {
+            "ListScoringFunctionsResponse": {
                 "type": "object",
                 "properties": {
-                    "mcp_endpoint": {
-                        "$ref": "#/components/schemas/URL"
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/ScoringFn"
+                        }
                     }
                 },
-                "additionalProperties": false
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListShieldsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/Shield"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListToolGroupsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/ToolGroup"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
+            },
+            "ListToolsResponse": {
+                "type": "object",
+                "properties": {
+                    "data": {
+                        "type": "array",
+                        "items": {
+                            "$ref": "#/components/schemas/Tool"
+                        }
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "data"
+                ]
             },
             "LogSeverity": {
                 "type": "string",
@@ -7083,6 +7106,13 @@
                     "name"
                 ]
             },
+            "SpanStatus": {
+                "type": "string",
+                "enum": [
+                    "ok",
+                    "error"
+                ]
+            },
             "StructuredLogEvent": {
                 "type": "object",
                 "properties": {
@@ -7467,6 +7497,18 @@
                     "logger_config"
                 ]
             },
+            "PostTrainingJob": {
+                "type": "object",
+                "properties": {
+                    "job_uuid": {
+                        "type": "string"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "job_uuid"
+                ]
+            },
             "QueryDocumentsRequest": {
                 "type": "object",
                 "properties": {
@@ -7547,6 +7589,87 @@
                     "scores"
                 ]
             },
+            "QuerySpanTreeRequest": {
+                "type": "object",
+                "properties": {
+                    "span_id": {
+                        "type": "string"
+                    },
+                    "attributes_to_return": {
+                        "type": "array",
+                        "items": {
+                            "type": "string"
+                        }
+                    },
+                    "max_depth": {
+                        "type": "integer"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "span_id"
+                ]
+            },
+            "SpanWithStatus": {
+                "type": "object",
+                "properties": {
+                    "span_id": {
+                        "type": "string"
+                    },
+                    "trace_id": {
+                        "type": "string"
+                    },
+                    "parent_span_id": {
+                        "type": "string"
+                    },
+                    "name": {
+                        "type": "string"
+                    },
+                    "start_time": {
+                        "type": "string",
+                        "format": "date-time"
+                    },
+                    "end_time": {
+                        "type": "string",
+                        "format": "date-time"
+                    },
+                    "attributes": {
+                        "type": "object",
+                        "additionalProperties": {
+                            "oneOf": [
+                                {
+                                    "type": "null"
+                                },
+                                {
+                                    "type": "boolean"
+                                },
+                                {
+                                    "type": "number"
+                                },
+                                {
+                                    "type": "string"
+                                },
+                                {
+                                    "type": "array"
+                                },
+                                {
+                                    "type": "object"
+                                }
+                            ]
+                        }
+                    },
+                    "status": {
+                        "$ref": "#/components/schemas/SpanStatus"
+                    }
+                },
+                "additionalProperties": false,
+                "required": [
+                    "span_id",
+                    "trace_id",
+                    "name",
+                    "start_time"
+                ]
+            },
             "QueryCondition": {
                 "type": "object",
                 "properties": {
@@ -8606,54 +8729,6 @@
                 ],
                 "title": "Response from the synthetic data generation. Batch of (prompt, response, score) tuples that pass the threshold."
             },
-            "UnregisterDatasetRequest": {
-                "type": "object",
-                "properties": {
-                    "dataset_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "dataset_id"
-                ]
-            },
-            "UnregisterMemoryBankRequest": {
-                "type": "object",
-                "properties": {
-                    "memory_bank_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "memory_bank_id"
-                ]
-            },
-            "UnregisterModelRequest": {
-                "type": "object",
-                "properties": {
-                    "model_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "model_id"
-                ]
-            },
-            "UnregisterToolGroupRequest": {
-                "type": "object",
-                "properties": {
-                    "tool_group_id": {
-                        "type": "string"
-                    }
-                },
-                "additionalProperties": false,
-                "required": [
-                    "tool_group_id"
-                ]
-            },
             "VersionInfo": {
                 "type": "object",
                 "properties": {
@@ -8855,14 +8930,6 @@
         {
             "name": "Datasets"
         },
-        {
-            "name": "DeleteAgentsRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/DeleteAgentsRequest\" />"
-        },
-        {
-            "name": "DeleteAgentsSessionRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/DeleteAgentsSessionRequest\" />"
-        },
         {
             "name": "EfficiencyConfig",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/EfficiencyConfig\" />"
@@ -8893,14 +8960,6 @@
             "name": "EvaluateRowsRequest",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/EvaluateRowsRequest\" />"
         },
-        {
-            "name": "GetAgentsSessionRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/GetAgentsSessionRequest\" />"
-        },
-        {
-            "name": "GetSpanTreeRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/GetSpanTreeRequest\" />"
-        },
         {
             "name": "GraphMemoryBank",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/GraphMemoryBank\" />"
@@ -8909,6 +8968,10 @@
             "name": "GraphMemoryBankParams",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/GraphMemoryBankParams\" />"
         },
+        {
+            "name": "GreedySamplingStrategy",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/GreedySamplingStrategy\" />"
+        },
         {
             "name": "HealthInfo",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/HealthInfo\" />"
@@ -8980,8 +9043,44 @@
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/LLMAsJudgeScoringFnParams\" />"
         },
         {
-            "name": "ListRuntimeToolsRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListRuntimeToolsRequest\" />"
+            "name": "ListDatasetsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListDatasetsResponse\" />"
+        },
+        {
+            "name": "ListEvalTasksResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListEvalTasksResponse\" />"
+        },
+        {
+            "name": "ListMemoryBanksResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListMemoryBanksResponse\" />"
+        },
+        {
+            "name": "ListModelsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListModelsResponse\" />"
+        },
+        {
+            "name": "ListPostTrainingJobsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListPostTrainingJobsResponse\" />"
+        },
+        {
+            "name": "ListProvidersResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListProvidersResponse\" />"
+        },
+        {
+            "name": "ListScoringFunctionsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListScoringFunctionsResponse\" />"
+        },
+        {
+            "name": "ListShieldsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListShieldsResponse\" />"
+        },
+        {
+            "name": "ListToolGroupsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListToolGroupsResponse\" />"
+        },
+        {
+            "name": "ListToolsResponse",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/ListToolsResponse\" />"
         },
         {
             "name": "LogEventRequest",
@@ -9095,6 +9194,10 @@
             "name": "QueryDocumentsResponse",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/QueryDocumentsResponse\" />"
         },
+        {
+            "name": "QuerySpanTreeRequest",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/QuerySpanTreeRequest\" />"
+        },
         {
             "name": "QuerySpansRequest",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/QuerySpansRequest\" />"
@@ -9166,10 +9269,6 @@
             "name": "SamplingParams",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/SamplingParams\" />"
         },
-        {
-            "name": "SamplingStrategy",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/SamplingStrategy\" />"
-        },
         {
             "name": "SaveSpansToDatasetRequest",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/SaveSpansToDatasetRequest\" />"
@@ -9351,6 +9450,14 @@
         {
             "name": "ToolRuntime"
         },
+        {
+            "name": "TopKSamplingStrategy",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/TopKSamplingStrategy\" />"
+        },
+        {
+            "name": "TopPSamplingStrategy",
+            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/TopPSamplingStrategy\" />"
+        },
         {
             "name": "Trace",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/Trace\" />"
@@ -9367,22 +9474,6 @@
             "name": "URL",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/URL\" />"
         },
-        {
-            "name": "UnregisterDatasetRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/UnregisterDatasetRequest\" />"
-        },
-        {
-            "name": "UnregisterMemoryBankRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/UnregisterMemoryBankRequest\" />"
-        },
-        {
-            "name": "UnregisterModelRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/UnregisterModelRequest\" />"
-        },
-        {
-            "name": "UnregisterToolGroupRequest",
-            "description": "<SchemaDefinition schemaRef=\"#/components/schemas/UnregisterToolGroupRequest\" />"
-        },
         {
             "name": "UnstructuredLogEvent",
             "description": "<SchemaDefinition schemaRef=\"#/components/schemas/UnstructuredLogEvent\" />"
@@ -9479,18 +9570,15 @@
                 "DataConfig",
                 "Dataset",
                 "DatasetFormat",
-                "DeleteAgentsRequest",
-                "DeleteAgentsSessionRequest",
                 "EfficiencyConfig",
                 "EmbeddingsRequest",
                 "EmbeddingsResponse",
                 "EvalTask",
                 "EvaluateResponse",
                 "EvaluateRowsRequest",
-                "GetAgentsSessionRequest",
-                "GetSpanTreeRequest",
                 "GraphMemoryBank",
                 "GraphMemoryBankParams",
+                "GreedySamplingStrategy",
                 "HealthInfo",
                 "ImageContentItem",
                 "ImageDelta",
@@ -9507,7 +9595,16 @@
                 "KeywordMemoryBank",
                 "KeywordMemoryBankParams",
                 "LLMAsJudgeScoringFnParams",
-                "ListRuntimeToolsRequest",
+                "ListDatasetsResponse",
+                "ListEvalTasksResponse",
+                "ListMemoryBanksResponse",
+                "ListModelsResponse",
+                "ListPostTrainingJobsResponse",
+                "ListProvidersResponse",
+                "ListScoringFunctionsResponse",
+                "ListShieldsResponse",
+                "ListToolGroupsResponse",
+                "ListToolsResponse",
                 "LogEventRequest",
                 "LogSeverity",
                 "LoraFinetuningConfig",
@@ -9533,6 +9630,7 @@
                 "QueryConditionOp",
                 "QueryDocumentsRequest",
                 "QueryDocumentsResponse",
+                "QuerySpanTreeRequest",
                 "QuerySpansRequest",
                 "QueryTracesRequest",
                 "RegexParserScoringFnParams",
@@ -9550,7 +9648,6 @@
                 "RunShieldResponse",
                 "SafetyViolation",
                 "SamplingParams",
-                "SamplingStrategy",
                 "SaveSpansToDatasetRequest",
                 "ScoreBatchRequest",
                 "ScoreBatchResponse",
@@ -9591,14 +9688,12 @@
                 "ToolPromptFormat",
                 "ToolResponse",
                 "ToolResponseMessage",
+                "TopKSamplingStrategy",
+                "TopPSamplingStrategy",
                 "Trace",
                 "TrainingConfig",
                 "Turn",
                 "URL",
-                "UnregisterDatasetRequest",
-                "UnregisterMemoryBankRequest",
-                "UnregisterModelRequest",
-                "UnregisterToolGroupRequest",
                 "UnstructuredLogEvent",
                 "UserMessage",
                 "VectorMemoryBank",
diff --git a/docs/resources/llama-stack-spec.yaml b/docs/resources/llama-stack-spec.yaml
index 2afb8e375..ab27e4f3d 100644
--- a/docs/resources/llama-stack-spec.yaml
+++ b/docs/resources/llama-stack-spec.yaml
@@ -584,19 +584,14 @@ components:
     CreateAgentSessionRequest:
       additionalProperties: false
       properties:
-        agent_id:
-          type: string
         session_name:
           type: string
       required:
-      - agent_id
       - session_name
       type: object
     CreateAgentTurnRequest:
       additionalProperties: false
       properties:
-        agent_id:
-          type: string
         documents:
           items:
             additionalProperties: false
@@ -622,8 +617,6 @@ components:
             - $ref: '#/components/schemas/UserMessage'
             - $ref: '#/components/schemas/ToolResponseMessage'
           type: array
-        session_id:
-          type: string
         stream:
           type: boolean
         toolgroups:
@@ -631,8 +624,6 @@ components:
             $ref: '#/components/schemas/AgentTool'
           type: array
       required:
-      - agent_id
-      - session_id
       - messages
       type: object
     DPOAlignmentConfig:
@@ -720,25 +711,6 @@ components:
       - instruct
       - dialog
       type: string
-    DeleteAgentsRequest:
-      additionalProperties: false
-      properties:
-        agent_id:
-          type: string
-      required:
-      - agent_id
-      type: object
-    DeleteAgentsSessionRequest:
-      additionalProperties: false
-      properties:
-        agent_id:
-          type: string
-        session_id:
-          type: string
-      required:
-      - agent_id
-      - session_id
-      type: object
     EfficiencyConfig:
       additionalProperties: false
       properties:
@@ -872,22 +844,6 @@ components:
       - scoring_functions
       - task_config
       type: object
-    GetAgentsSessionRequest:
-      additionalProperties: false
-      properties:
-        turn_ids:
-          items:
-            type: string
-          type: array
-      type: object
-    GetSpanTreeRequest:
-      additionalProperties: false
-      properties:
-        attributes_to_return:
-          items:
-            type: string
-          type: array
-      type: object
     GraphMemoryBank:
       additionalProperties: false
       properties:
@@ -922,6 +878,16 @@ components:
       required:
       - memory_bank_type
       type: object
+    GreedySamplingStrategy:
+      additionalProperties: false
+      properties:
+        type:
+          const: greedy
+          default: greedy
+          type: string
+      required:
+      - type
+      type: object
     HealthInfo:
       additionalProperties: false
       properties:
@@ -1045,8 +1011,8 @@ components:
         task_id:
           type: string
       required:
-      - task_id
       - job_id
+      - task_id
       type: object
     JobStatus:
       enum:
@@ -1146,11 +1112,111 @@ components:
       - type
       - judge_model
       type: object
-    ListRuntimeToolsRequest:
+    ListDatasetsResponse:
       additionalProperties: false
       properties:
-        mcp_endpoint:
-          $ref: '#/components/schemas/URL'
+        data:
+          items:
+            $ref: '#/components/schemas/Dataset'
+          type: array
+      required:
+      - data
+      type: object
+    ListEvalTasksResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/EvalTask'
+          type: array
+      required:
+      - data
+      type: object
+    ListMemoryBanksResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/MemoryBank'
+          type: array
+      required:
+      - data
+      type: object
+    ListModelsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/Model'
+          type: array
+      required:
+      - data
+      type: object
+    ListPostTrainingJobsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            additionalProperties: false
+            properties:
+              job_uuid:
+                type: string
+            required:
+            - job_uuid
+            type: object
+          type: array
+      required:
+      - data
+      type: object
+    ListProvidersResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/ProviderInfo'
+          type: array
+      required:
+      - data
+      type: object
+    ListScoringFunctionsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/ScoringFn'
+          type: array
+      required:
+      - data
+      type: object
+    ListShieldsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/Shield'
+          type: array
+      required:
+      - data
+      type: object
+    ListToolGroupsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/ToolGroup'
+          type: array
+      required:
+      - data
+      type: object
+    ListToolsResponse:
+      additionalProperties: false
+      properties:
+        data:
+          items:
+            $ref: '#/components/schemas/Tool'
+          type: array
+      required:
+      - data
       type: object
     LogEventRequest:
       additionalProperties: false
@@ -1715,6 +1781,20 @@ components:
       - chunks
       - scores
       type: object
+    QuerySpanTreeRequest:
+      additionalProperties: false
+      properties:
+        attributes_to_return:
+          items:
+            type: string
+          type: array
+        max_depth:
+          type: integer
+        span_id:
+          type: string
+      required:
+      - span_id
+      type: object
     QuerySpansRequest:
       additionalProperties: false
       properties:
@@ -2069,26 +2149,13 @@ components:
           default: 1.0
           type: number
         strategy:
-          $ref: '#/components/schemas/SamplingStrategy'
-          default: greedy
-        temperature:
-          default: 0.0
-          type: number
-        top_k:
-          default: 0
-          type: integer
-        top_p:
-          default: 0.95
-          type: number
+          oneOf:
+          - $ref: '#/components/schemas/GreedySamplingStrategy'
+          - $ref: '#/components/schemas/TopPSamplingStrategy'
+          - $ref: '#/components/schemas/TopKSamplingStrategy'
       required:
       - strategy
       type: object
-    SamplingStrategy:
-      enum:
-      - greedy
-      - top_p
-      - top_k
-      type: string
     SaveSpansToDatasetRequest:
       additionalProperties: false
       properties:
@@ -2945,6 +3012,34 @@ components:
       - tool_name
       - content
       type: object
+    TopKSamplingStrategy:
+      additionalProperties: false
+      properties:
+        top_k:
+          type: integer
+        type:
+          const: top_k
+          default: top_k
+          type: string
+      required:
+      - type
+      - top_k
+      type: object
+    TopPSamplingStrategy:
+      additionalProperties: false
+      properties:
+        temperature:
+          type: number
+        top_p:
+          default: 0.95
+          type: number
+        type:
+          const: top_p
+          default: top_p
+          type: string
+      required:
+      - type
+      type: object
     Trace:
       additionalProperties: false
       properties:
@@ -3057,38 +3152,6 @@ components:
       required:
       - uri
       type: object
-    UnregisterDatasetRequest:
-      additionalProperties: false
-      properties:
-        dataset_id:
-          type: string
-      required:
-      - dataset_id
-      type: object
-    UnregisterMemoryBankRequest:
-      additionalProperties: false
-      properties:
-        memory_bank_id:
-          type: string
-      required:
-      - memory_bank_id
-      type: object
-    UnregisterModelRequest:
-      additionalProperties: false
-      properties:
-        model_id:
-          type: string
-      required:
-      - model_id
-      type: object
-    UnregisterToolGroupRequest:
-      additionalProperties: false
-      properties:
-        tool_group_id:
-          type: string
-      required:
-      - tool_group_id
-      type: object
     UnstructuredLogEvent:
       additionalProperties: false
       properties:
@@ -3216,7 +3279,7 @@ info:
 jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema
 openapi: 3.1.0
 paths:
-  /v1/agents/create:
+  /v1/agents:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -3248,9 +3311,14 @@ paths:
           description: OK
       tags:
       - Agents
-  /v1/agents/delete:
-    post:
+  /v1/agents/{agent_id}:
+    delete:
       parameters:
+      - in: path
+        name: agent_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3265,20 +3333,19 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/DeleteAgentsRequest'
-        required: true
       responses:
         '200':
           description: OK
       tags:
       - Agents
-  /v1/agents/session/create:
+  /v1/agents/{agent_id}/session:
     post:
       parameters:
+      - in: path
+        name: agent_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3308,9 +3375,19 @@ paths:
           description: OK
       tags:
       - Agents
-  /v1/agents/session/delete:
-    post:
+  /v1/agents/{agent_id}/session/{session_id}:
+    delete:
       parameters:
+      - in: path
+        name: session_id
+        required: true
+        schema:
+          type: string
+      - in: path
+        name: agent_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3325,30 +3402,30 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/DeleteAgentsSessionRequest'
-        required: true
       responses:
         '200':
           description: OK
       tags:
       - Agents
-  /v1/agents/session/get:
-    post:
+    get:
       parameters:
-      - in: query
+      - in: path
+        name: session_id
+        required: true
+        schema:
+          type: string
+      - in: path
         name: agent_id
         required: true
         schema:
           type: string
       - in: query
-        name: session_id
-        required: true
+        name: turn_ids
+        required: false
         schema:
-          type: string
+          items:
+            type: string
+          type: array
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3363,12 +3440,6 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/GetAgentsSessionRequest'
-        required: true
       responses:
         '200':
           content:
@@ -3378,55 +3449,19 @@ paths:
           description: OK
       tags:
       - Agents
-  /v1/agents/step/get:
-    get:
+  /v1/agents/{agent_id}/session/{session_id}/turn:
+    post:
       parameters:
-      - in: query
+      - in: path
         name: agent_id
         required: true
         schema:
           type: string
-      - in: query
+      - in: path
         name: session_id
         required: true
         schema:
           type: string
-      - in: query
-        name: turn_id
-        required: true
-        schema:
-          type: string
-      - in: query
-        name: step_id
-        required: true
-        schema:
-          type: string
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/AgentStepResponse'
-          description: OK
-      tags:
-      - Agents
-  /v1/agents/turn/create:
-    post:
-      parameters:
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3459,20 +3494,20 @@ paths:
             streamed agent turn completion response.
       tags:
       - Agents
-  /v1/agents/turn/get:
+  /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}:
     get:
       parameters:
-      - in: query
+      - in: path
         name: agent_id
         required: true
         schema:
           type: string
-      - in: query
+      - in: path
         name: session_id
         required: true
         schema:
           type: string
-      - in: query
+      - in: path
         name: turn_id
         required: true
         schema:
@@ -3500,6 +3535,52 @@ paths:
           description: OK
       tags:
       - Agents
+  /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/step/{step_id}:
+    get:
+      parameters:
+      - in: path
+        name: agent_id
+        required: true
+        schema:
+          type: string
+      - in: path
+        name: session_id
+        required: true
+        schema:
+          type: string
+      - in: path
+        name: turn_id
+        required: true
+        schema:
+          type: string
+      - in: path
+        name: step_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/AgentStepResponse'
+          description: OK
+      tags:
+      - Agents
   /v1/batch-inference/chat-completion:
     post:
       parameters:
@@ -3564,35 +3645,7 @@ paths:
           description: OK
       tags:
       - BatchInference (Coming Soon)
-  /v1/datasetio/append-rows:
-    post:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/AppendRowsRequest'
-        required: true
-      responses:
-        '200':
-          description: OK
-      tags:
-      - DatasetIO
-  /v1/datasetio/get-rows-paginated:
+  /v1/datasetio/rows:
     get:
       parameters:
       - in: query
@@ -3638,10 +3691,116 @@ paths:
           description: OK
       tags:
       - DatasetIO
-  /v1/datasets/get:
+    post:
+      parameters:
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/AppendRowsRequest'
+        required: true
+      responses:
+        '200':
+          description: OK
+      tags:
+      - DatasetIO
+  /v1/datasets:
     get:
       parameters:
-      - in: query
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ListDatasetsResponse'
+          description: OK
+      tags:
+      - Datasets
+    post:
+      parameters:
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/RegisterDatasetRequest'
+        required: true
+      responses:
+        '200':
+          description: OK
+      tags:
+      - Datasets
+  /v1/datasets/{dataset_id}:
+    delete:
+      parameters:
+      - in: path
+        name: dataset_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          description: OK
+      tags:
+      - Datasets
+    get:
+      parameters:
+      - in: path
         name: dataset_id
         required: true
         schema:
@@ -3671,7 +3830,7 @@ paths:
           description: OK
       tags:
       - Datasets
-  /v1/datasets/list:
+  /v1/eval-tasks:
     get:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -3691,13 +3850,12 @@ paths:
       responses:
         '200':
           content:
-            application/jsonl:
+            application/json:
               schema:
-                $ref: '#/components/schemas/Dataset'
+                $ref: '#/components/schemas/ListEvalTasksResponse'
           description: OK
       tags:
-      - Datasets
-  /v1/datasets/register:
+      - EvalTasks
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -3718,46 +3876,18 @@ paths:
         content:
           application/json:
             schema:
-              $ref: '#/components/schemas/RegisterDatasetRequest'
+              $ref: '#/components/schemas/RegisterEvalTaskRequest'
         required: true
       responses:
         '200':
           description: OK
       tags:
-      - Datasets
-  /v1/datasets/unregister:
-    post:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/UnregisterDatasetRequest'
-        required: true
-      responses:
-        '200':
-          description: OK
-      tags:
-      - Datasets
-  /v1/eval-tasks/get:
+      - EvalTasks
+  /v1/eval-tasks/{eval_task_id}:
     get:
       parameters:
-      - in: query
-        name: name
+      - in: path
+        name: eval_task_id
         required: true
         schema:
           type: string
@@ -3786,60 +3916,6 @@ paths:
           description: OK
       tags:
       - EvalTasks
-  /v1/eval-tasks/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/EvalTask'
-          description: OK
-      tags:
-      - EvalTasks
-  /v1/eval-tasks/register:
-    post:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/RegisterEvalTaskRequest'
-        required: true
-      responses:
-        '200':
-          description: OK
-      tags:
-      - EvalTasks
   /v1/eval/evaluate-rows:
     post:
       parameters:
@@ -3872,7 +3948,7 @@ paths:
           description: OK
       tags:
       - Eval
-  /v1/eval/job/cancel:
+  /v1/eval/jobs/cancel:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -3900,55 +3976,19 @@ paths:
           description: OK
       tags:
       - Eval
-  /v1/eval/job/result:
+  /v1/eval/jobs/{job_id}:
     get:
       parameters:
-      - in: query
-        name: task_id
-        required: true
-        schema:
-          type: string
-      - in: query
+      - in: path
         name: job_id
         required: true
         schema:
           type: string
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/json:
-              schema:
-                $ref: '#/components/schemas/EvaluateResponse'
-          description: OK
-      tags:
-      - Eval
-  /v1/eval/job/status:
-    get:
-      parameters:
       - in: query
         name: task_id
         required: true
         schema:
           type: string
-      - in: query
-        name: job_id
-        required: true
-        schema:
-          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -3974,7 +4014,43 @@ paths:
           description: OK
       tags:
       - Eval
-  /v1/eval/run-eval:
+  /v1/eval/jobs/{job_id}/result:
+    get:
+      parameters:
+      - in: path
+        name: job_id
+        required: true
+        schema:
+          type: string
+      - in: query
+        name: task_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/EvaluateResponse'
+          description: OK
+      tags:
+      - Eval
+  /v1/eval/run:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -4132,14 +4208,9 @@ paths:
           description: OK
       tags:
       - Inference
-  /v1/memory-banks/get:
+  /v1/memory-banks:
     get:
       parameters:
-      - in: query
-        name: memory_bank_id
-        required: true
-        schema:
-          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -4159,39 +4230,10 @@ paths:
           content:
             application/json:
               schema:
-                oneOf:
-                - $ref: '#/components/schemas/MemoryBank'
-                - type: 'null'
+                $ref: '#/components/schemas/ListMemoryBanksResponse'
           description: OK
       tags:
       - MemoryBanks
-  /v1/memory-banks/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/MemoryBank'
-          description: OK
-      tags:
-      - MemoryBanks
-  /v1/memory-banks/register:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -4227,9 +4269,14 @@ paths:
           description: ''
       tags:
       - MemoryBanks
-  /v1/memory-banks/unregister:
-    post:
+  /v1/memory-banks/{memory_bank_id}:
+    delete:
       parameters:
+      - in: path
+        name: memory_bank_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -4244,17 +4291,43 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/UnregisterMemoryBankRequest'
-        required: true
       responses:
         '200':
           description: OK
       tags:
       - MemoryBanks
+    get:
+      parameters:
+      - in: path
+        name: memory_bank_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                oneOf:
+                - $ref: '#/components/schemas/MemoryBank'
+                - type: 'null'
+          description: OK
+      tags:
+      - MemoryBanks
   /v1/memory/insert:
     post:
       parameters:
@@ -4315,14 +4388,9 @@ paths:
           description: OK
       tags:
       - Memory
-  /v1/models/get:
+  /v1/models:
     get:
       parameters:
-      - in: query
-        name: identifier
-        required: true
-        schema:
-          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -4342,39 +4410,10 @@ paths:
           content:
             application/json:
               schema:
-                oneOf:
-                - $ref: '#/components/schemas/Model'
-                - type: 'null'
+                $ref: '#/components/schemas/ListModelsResponse'
           description: OK
       tags:
       - Models
-  /v1/models/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/Model'
-          description: OK
-      tags:
-      - Models
-  /v1/models/register:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -4406,9 +4445,14 @@ paths:
           description: OK
       tags:
       - Models
-  /v1/models/unregister:
-    post:
+  /v1/models/{model_id}:
+    delete:
       parameters:
+      - in: path
+        name: model_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -4423,17 +4467,43 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/UnregisterModelRequest'
-        required: true
       responses:
         '200':
           description: OK
       tags:
       - Models
+    get:
+      parameters:
+      - in: path
+        name: model_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                oneOf:
+                - $ref: '#/components/schemas/Model'
+                - type: 'null'
+          description: OK
+      tags:
+      - Models
   /v1/post-training/job/artifacts:
     get:
       parameters:
@@ -4548,9 +4618,9 @@ paths:
       responses:
         '200':
           content:
-            application/jsonl:
+            application/json:
               schema:
-                $ref: '#/components/schemas/PostTrainingJob'
+                $ref: '#/components/schemas/ListPostTrainingJobsResponse'
           description: OK
       tags:
       - PostTraining (Coming Soon)
@@ -4640,9 +4710,7 @@ paths:
           content:
             application/json:
               schema:
-                additionalProperties:
-                  $ref: '#/components/schemas/ProviderInfo'
-                type: object
+                $ref: '#/components/schemas/ListProvidersResponse'
           description: OK
       tags:
       - Inspect
@@ -4708,10 +4776,63 @@ paths:
           description: OK
       tags:
       - Safety
-  /v1/scoring-functions/get:
+  /v1/scoring-functions:
     get:
       parameters:
-      - in: query
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ListScoringFunctionsResponse'
+          description: OK
+      tags:
+      - ScoringFunctions
+    post:
+      parameters:
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/RegisterScoringFunctionRequest'
+        required: true
+      responses:
+        '200':
+          description: OK
+      tags:
+      - ScoringFunctions
+  /v1/scoring-functions/{scoring_fn_id}:
+    get:
+      parameters:
+      - in: path
         name: scoring_fn_id
         required: true
         schema:
@@ -4741,60 +4862,6 @@ paths:
           description: OK
       tags:
       - ScoringFunctions
-  /v1/scoring-functions/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/ScoringFn'
-          description: OK
-      tags:
-      - ScoringFunctions
-  /v1/scoring-functions/register:
-    post:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/RegisterScoringFunctionRequest'
-        required: true
-      responses:
-        '200':
-          description: OK
-      tags:
-      - ScoringFunctions
   /v1/scoring/score:
     post:
       parameters:
@@ -4859,14 +4926,9 @@ paths:
           description: OK
       tags:
       - Scoring
-  /v1/shields/get:
+  /v1/shields:
     get:
       parameters:
-      - in: query
-        name: identifier
-        required: true
-        schema:
-          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -4886,39 +4948,10 @@ paths:
           content:
             application/json:
               schema:
-                oneOf:
-                - $ref: '#/components/schemas/Shield'
-                - type: 'null'
+                $ref: '#/components/schemas/ListShieldsResponse'
           description: OK
       tags:
       - Shields
-  /v1/shields/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/Shield'
-          description: OK
-      tags:
-      - Shields
-  /v1/shields/register:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -4950,6 +4983,39 @@ paths:
           description: OK
       tags:
       - Shields
+  /v1/shields/{identifier}:
+    get:
+      parameters:
+      - in: path
+        name: identifier
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                oneOf:
+                - $ref: '#/components/schemas/Shield'
+                - type: 'null'
+          description: OK
+      tags:
+      - Shields
   /v1/synthetic-data-generation/generate:
     post:
       parameters:
@@ -4982,50 +5048,6 @@ paths:
           description: OK
       tags:
       - SyntheticDataGeneration (Coming Soon)
-  /v1/telemetry/get-span-tree:
-    post:
-      parameters:
-      - in: query
-        name: span_id
-        required: true
-        schema:
-          type: string
-      - in: query
-        name: max_depth
-        required: false
-        schema:
-          type: integer
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/GetSpanTreeRequest'
-        required: true
-      responses:
-        '200':
-          content:
-            application/json:
-              schema:
-                additionalProperties:
-                  $ref: '#/components/schemas/SpanWithStatus'
-                type: object
-          description: OK
-      tags:
-      - Telemetry
   /v1/telemetry/log-event:
     post:
       parameters:
@@ -5054,6 +5076,40 @@ paths:
           description: OK
       tags:
       - Telemetry
+  /v1/telemetry/query-span-tree:
+    post:
+      parameters:
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      requestBody:
+        content:
+          application/json:
+            schema:
+              $ref: '#/components/schemas/QuerySpanTreeRequest'
+        required: true
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                additionalProperties:
+                  $ref: '#/components/schemas/SpanWithStatus'
+                type: object
+          description: OK
+      tags:
+      - Telemetry
   /v1/telemetry/query-spans:
     post:
       parameters:
@@ -5180,13 +5236,18 @@ paths:
       tags:
       - ToolRuntime
   /v1/tool-runtime/list-tools:
-    post:
+    get:
       parameters:
       - in: query
         name: tool_group_id
         required: false
         schema:
           type: string
+      - in: query
+        name: mcp_endpoint
+        required: false
+        schema:
+          $ref: '#/components/schemas/URL'
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -5201,12 +5262,6 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/ListRuntimeToolsRequest'
-        required: true
       responses:
         '200':
           content:
@@ -5216,14 +5271,9 @@ paths:
           description: OK
       tags:
       - ToolRuntime
-  /v1/toolgroups/get:
+  /v1/toolgroups:
     get:
       parameters:
-      - in: query
-        name: toolgroup_id
-        required: true
-        schema:
-          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -5243,38 +5293,11 @@ paths:
           content:
             application/json:
               schema:
-                $ref: '#/components/schemas/ToolGroup'
-          description: OK
-      tags:
-      - ToolGroups
-  /v1/toolgroups/list:
-    get:
-      parameters:
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/ToolGroup'
+                $ref: '#/components/schemas/ListToolGroupsResponse'
           description: OK
       summary: List tool groups with optional provider
       tags:
       - ToolGroups
-  /v1/toolgroups/register:
     post:
       parameters:
       - description: JSON-encoded provider data which will be made available to the
@@ -5303,9 +5326,14 @@ paths:
       summary: Register a tool group
       tags:
       - ToolGroups
-  /v1/toolgroups/unregister:
-    post:
+  /v1/toolgroups/{toolgroup_id}:
+    delete:
       parameters:
+      - in: path
+        name: toolgroup_id
+        required: true
+        schema:
+          type: string
       - description: JSON-encoded provider data which will be made available to the
           adapter servicing the API
         in: header
@@ -5320,22 +5348,78 @@ paths:
         required: false
         schema:
           type: string
-      requestBody:
-        content:
-          application/json:
-            schema:
-              $ref: '#/components/schemas/UnregisterToolGroupRequest'
-        required: true
       responses:
         '200':
           description: OK
       summary: Unregister a tool group
       tags:
       - ToolGroups
-  /v1/tools/get:
+    get:
+      parameters:
+      - in: path
+        name: toolgroup_id
+        required: true
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ToolGroup'
+          description: OK
+      tags:
+      - ToolGroups
+  /v1/tools:
     get:
       parameters:
       - in: query
+        name: toolgroup_id
+        required: false
+        schema:
+          type: string
+      - description: JSON-encoded provider data which will be made available to the
+          adapter servicing the API
+        in: header
+        name: X-LlamaStack-Provider-Data
+        required: false
+        schema:
+          type: string
+      - description: Version of the client making the request. This is used to ensure
+          that the client and server are compatible.
+        in: header
+        name: X-LlamaStack-Client-Version
+        required: false
+        schema:
+          type: string
+      responses:
+        '200':
+          content:
+            application/json:
+              schema:
+                $ref: '#/components/schemas/ListToolsResponse'
+          description: OK
+      summary: List tools with optional tool group
+      tags:
+      - ToolGroups
+  /v1/tools/{tool_name}:
+    get:
+      parameters:
+      - in: path
         name: tool_name
         required: true
         schema:
@@ -5363,38 +5447,6 @@ paths:
           description: OK
       tags:
       - ToolGroups
-  /v1/tools/list:
-    get:
-      parameters:
-      - in: query
-        name: tool_group_id
-        required: false
-        schema:
-          type: string
-      - description: JSON-encoded provider data which will be made available to the
-          adapter servicing the API
-        in: header
-        name: X-LlamaStack-Provider-Data
-        required: false
-        schema:
-          type: string
-      - description: Version of the client making the request. This is used to ensure
-          that the client and server are compatible.
-        in: header
-        name: X-LlamaStack-Client-Version
-        required: false
-        schema:
-          type: string
-      responses:
-        '200':
-          content:
-            application/jsonl:
-              schema:
-                $ref: '#/components/schemas/Tool'
-          description: OK
-      summary: List tools with optional tool group
-      tags:
-      - ToolGroups
   /v1/version:
     get:
       parameters:
@@ -5568,12 +5620,6 @@ tags:
   name: DatasetFormat
 - name: DatasetIO
 - name: Datasets
-- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsRequest"
-    />
-  name: DeleteAgentsRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsSessionRequest"
-    />
-  name: DeleteAgentsSessionRequest
 - description: <SchemaDefinition schemaRef="#/components/schemas/EfficiencyConfig"
     />
   name: EfficiencyConfig
@@ -5593,18 +5639,15 @@ tags:
 - description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateRowsRequest"
     />
   name: EvaluateRowsRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/GetAgentsSessionRequest"
-    />
-  name: GetAgentsSessionRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/GetSpanTreeRequest"
-    />
-  name: GetSpanTreeRequest
 - description: <SchemaDefinition schemaRef="#/components/schemas/GraphMemoryBank"
     />
   name: GraphMemoryBank
 - description: <SchemaDefinition schemaRef="#/components/schemas/GraphMemoryBankParams"
     />
   name: GraphMemoryBankParams
+- description: <SchemaDefinition schemaRef="#/components/schemas/GreedySamplingStrategy"
+    />
+  name: GreedySamplingStrategy
 - description: <SchemaDefinition schemaRef="#/components/schemas/HealthInfo" />
   name: HealthInfo
 - description: <SchemaDefinition schemaRef="#/components/schemas/ImageContentItem"
@@ -5650,9 +5693,36 @@ tags:
 - description: <SchemaDefinition schemaRef="#/components/schemas/LLMAsJudgeScoringFnParams"
     />
   name: LLMAsJudgeScoringFnParams
-- description: <SchemaDefinition schemaRef="#/components/schemas/ListRuntimeToolsRequest"
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListDatasetsResponse"
     />
-  name: ListRuntimeToolsRequest
+  name: ListDatasetsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListEvalTasksResponse"
+    />
+  name: ListEvalTasksResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListMemoryBanksResponse"
+    />
+  name: ListMemoryBanksResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListModelsResponse"
+    />
+  name: ListModelsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListPostTrainingJobsResponse"
+    />
+  name: ListPostTrainingJobsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListProvidersResponse"
+    />
+  name: ListProvidersResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListScoringFunctionsResponse"
+    />
+  name: ListScoringFunctionsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListShieldsResponse"
+    />
+  name: ListShieldsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListToolGroupsResponse"
+    />
+  name: ListToolGroupsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/ListToolsResponse"
+    />
+  name: ListToolsResponse
 - description: <SchemaDefinition schemaRef="#/components/schemas/LogEventRequest"
     />
   name: LogEventRequest
@@ -5727,6 +5797,9 @@ tags:
 - description: <SchemaDefinition schemaRef="#/components/schemas/QueryDocumentsResponse"
     />
   name: QueryDocumentsResponse
+- description: <SchemaDefinition schemaRef="#/components/schemas/QuerySpanTreeRequest"
+    />
+  name: QuerySpanTreeRequest
 - description: <SchemaDefinition schemaRef="#/components/schemas/QuerySpansRequest"
     />
   name: QuerySpansRequest
@@ -5775,9 +5848,6 @@ tags:
   name: SafetyViolation
 - description: <SchemaDefinition schemaRef="#/components/schemas/SamplingParams" />
   name: SamplingParams
-- description: <SchemaDefinition schemaRef="#/components/schemas/SamplingStrategy"
-    />
-  name: SamplingStrategy
 - description: <SchemaDefinition schemaRef="#/components/schemas/SaveSpansToDatasetRequest"
     />
   name: SaveSpansToDatasetRequest
@@ -5898,6 +5968,12 @@ tags:
     />
   name: ToolResponseMessage
 - name: ToolRuntime
+- description: <SchemaDefinition schemaRef="#/components/schemas/TopKSamplingStrategy"
+    />
+  name: TopKSamplingStrategy
+- description: <SchemaDefinition schemaRef="#/components/schemas/TopPSamplingStrategy"
+    />
+  name: TopPSamplingStrategy
 - description: <SchemaDefinition schemaRef="#/components/schemas/Trace" />
   name: Trace
 - description: <SchemaDefinition schemaRef="#/components/schemas/TrainingConfig" />
@@ -5909,18 +5985,6 @@ tags:
   name: Turn
 - description: <SchemaDefinition schemaRef="#/components/schemas/URL" />
   name: URL
-- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterDatasetRequest"
-    />
-  name: UnregisterDatasetRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterMemoryBankRequest"
-    />
-  name: UnregisterMemoryBankRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterModelRequest"
-    />
-  name: UnregisterModelRequest
-- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterToolGroupRequest"
-    />
-  name: UnregisterToolGroupRequest
 - description: <SchemaDefinition schemaRef="#/components/schemas/UnstructuredLogEvent"
     />
   name: UnstructuredLogEvent
@@ -6003,18 +6067,15 @@ x-tagGroups:
   - DataConfig
   - Dataset
   - DatasetFormat
-  - DeleteAgentsRequest
-  - DeleteAgentsSessionRequest
   - EfficiencyConfig
   - EmbeddingsRequest
   - EmbeddingsResponse
   - EvalTask
   - EvaluateResponse
   - EvaluateRowsRequest
-  - GetAgentsSessionRequest
-  - GetSpanTreeRequest
   - GraphMemoryBank
   - GraphMemoryBankParams
+  - GreedySamplingStrategy
   - HealthInfo
   - ImageContentItem
   - ImageDelta
@@ -6031,7 +6092,16 @@ x-tagGroups:
   - KeywordMemoryBank
   - KeywordMemoryBankParams
   - LLMAsJudgeScoringFnParams
-  - ListRuntimeToolsRequest
+  - ListDatasetsResponse
+  - ListEvalTasksResponse
+  - ListMemoryBanksResponse
+  - ListModelsResponse
+  - ListPostTrainingJobsResponse
+  - ListProvidersResponse
+  - ListScoringFunctionsResponse
+  - ListShieldsResponse
+  - ListToolGroupsResponse
+  - ListToolsResponse
   - LogEventRequest
   - LogSeverity
   - LoraFinetuningConfig
@@ -6057,6 +6127,7 @@ x-tagGroups:
   - QueryConditionOp
   - QueryDocumentsRequest
   - QueryDocumentsResponse
+  - QuerySpanTreeRequest
   - QuerySpansRequest
   - QueryTracesRequest
   - RegexParserScoringFnParams
@@ -6074,7 +6145,6 @@ x-tagGroups:
   - RunShieldResponse
   - SafetyViolation
   - SamplingParams
-  - SamplingStrategy
   - SaveSpansToDatasetRequest
   - ScoreBatchRequest
   - ScoreBatchResponse
@@ -6115,14 +6185,12 @@ x-tagGroups:
   - ToolPromptFormat
   - ToolResponse
   - ToolResponseMessage
+  - TopKSamplingStrategy
+  - TopPSamplingStrategy
   - Trace
   - TrainingConfig
   - Turn
   - URL
-  - UnregisterDatasetRequest
-  - UnregisterMemoryBankRequest
-  - UnregisterModelRequest
-  - UnregisterToolGroupRequest
   - UnstructuredLogEvent
   - UserMessage
   - VectorMemoryBank
diff --git a/llama_stack/apis/agents/agents.py b/llama_stack/apis/agents/agents.py
index c3f3d21f0..63d0920fb 100644
--- a/llama_stack/apis/agents/agents.py
+++ b/llama_stack/apis/agents/agents.py
@@ -7,6 +7,7 @@
 from datetime import datetime
 from enum import Enum
 from typing import (
+    Annotated,
     Any,
     AsyncIterator,
     Dict,
@@ -20,7 +21,6 @@ from typing import (
 
 from llama_models.schema_utils import json_schema_type, register_schema, webmethod
 from pydantic import BaseModel, ConfigDict, Field
-from typing_extensions import Annotated
 
 from llama_stack.apis.common.content_types import ContentDelta, InterleavedContent, URL
 from llama_stack.apis.inference import (
@@ -296,13 +296,13 @@ class AgentStepResponse(BaseModel):
 @runtime_checkable
 @trace_protocol
 class Agents(Protocol):
-    @webmethod(route="/agents/create")
+    @webmethod(route="/agents", method="POST")
     async def create_agent(
         self,
         agent_config: AgentConfig,
     ) -> AgentCreateResponse: ...
 
-    @webmethod(route="/agents/turn/create")
+    @webmethod(route="/agents/{agent_id}/session/{session_id}/turn", method="POST")
     async def create_agent_turn(
         self,
         agent_id: str,
@@ -318,36 +318,52 @@ class Agents(Protocol):
         toolgroups: Optional[List[AgentToolGroup]] = None,
     ) -> Union[Turn, AsyncIterator[AgentTurnResponseStreamChunk]]: ...
 
-    @webmethod(route="/agents/turn/get")
+    @webmethod(
+        route="/agents/{agent_id}/session/{session_id}/turn/{turn_id}", method="GET"
+    )
     async def get_agents_turn(
-        self, agent_id: str, session_id: str, turn_id: str
+        self,
+        agent_id: str,
+        session_id: str,
+        turn_id: str,
     ) -> Turn: ...
 
-    @webmethod(route="/agents/step/get")
+    @webmethod(
+        route="/agents/{agent_id}/session/{session_id}/turn/{turn_id}/step/{step_id}",
+        method="GET",
+    )
     async def get_agents_step(
-        self, agent_id: str, session_id: str, turn_id: str, step_id: str
+        self,
+        agent_id: str,
+        session_id: str,
+        turn_id: str,
+        step_id: str,
     ) -> AgentStepResponse: ...
 
-    @webmethod(route="/agents/session/create")
+    @webmethod(route="/agents/{agent_id}/session", method="POST")
     async def create_agent_session(
         self,
         agent_id: str,
         session_name: str,
     ) -> AgentSessionCreateResponse: ...
 
-    @webmethod(route="/agents/session/get")
+    @webmethod(route="/agents/{agent_id}/session/{session_id}", method="GET")
     async def get_agents_session(
         self,
-        agent_id: str,
         session_id: str,
+        agent_id: str,
         turn_ids: Optional[List[str]] = None,
     ) -> Session: ...
 
-    @webmethod(route="/agents/session/delete")
-    async def delete_agents_session(self, agent_id: str, session_id: str) -> None: ...
+    @webmethod(route="/agents/{agent_id}/session/{session_id}", method="DELETE")
+    async def delete_agents_session(
+        self,
+        session_id: str,
+        agent_id: str,
+    ) -> None: ...
 
-    @webmethod(route="/agents/delete")
-    async def delete_agents(
+    @webmethod(route="/agents/{agent_id}", method="DELETE")
+    async def delete_agent(
         self,
         agent_id: str,
     ) -> None: ...
diff --git a/llama_stack/apis/batch_inference/batch_inference.py b/llama_stack/apis/batch_inference/batch_inference.py
index 81826a7b1..ca5ba059f 100644
--- a/llama_stack/apis/batch_inference/batch_inference.py
+++ b/llama_stack/apis/batch_inference/batch_inference.py
@@ -54,7 +54,7 @@ class BatchChatCompletionResponse(BaseModel):
 
 @runtime_checkable
 class BatchInference(Protocol):
-    @webmethod(route="/batch-inference/completion")
+    @webmethod(route="/batch-inference/completion", method="POST")
     async def batch_completion(
         self,
         model: str,
@@ -63,7 +63,7 @@ class BatchInference(Protocol):
         logprobs: Optional[LogProbConfig] = None,
     ) -> BatchCompletionResponse: ...
 
-    @webmethod(route="/batch-inference/chat-completion")
+    @webmethod(route="/batch-inference/chat-completion", method="POST")
     async def batch_chat_completion(
         self,
         model: str,
diff --git a/llama_stack/apis/datasetio/datasetio.py b/llama_stack/apis/datasetio/datasetio.py
index 983e0e4ea..8b4c25a1d 100644
--- a/llama_stack/apis/datasetio/datasetio.py
+++ b/llama_stack/apis/datasetio/datasetio.py
@@ -29,7 +29,7 @@ class DatasetIO(Protocol):
     # keeping for aligning with inference/safety, but this is not used
     dataset_store: DatasetStore
 
-    @webmethod(route="/datasetio/get-rows-paginated", method="GET")
+    @webmethod(route="/datasetio/rows", method="GET")
     async def get_rows_paginated(
         self,
         dataset_id: str,
@@ -38,7 +38,7 @@ class DatasetIO(Protocol):
         filter_condition: Optional[str] = None,
     ) -> PaginatedRowsResult: ...
 
-    @webmethod(route="/datasetio/append-rows", method="POST")
+    @webmethod(route="/datasetio/rows", method="POST")
     async def append_rows(
         self, dataset_id: str, rows: List[Dict[str, Any]]
     ) -> None: ...
diff --git a/llama_stack/apis/datasets/datasets.py b/llama_stack/apis/datasets/datasets.py
index 7afc0f8fd..5ad5bdcdb 100644
--- a/llama_stack/apis/datasets/datasets.py
+++ b/llama_stack/apis/datasets/datasets.py
@@ -7,11 +7,9 @@
 from typing import Any, Dict, List, Literal, Optional, Protocol
 
 from llama_models.schema_utils import json_schema_type, webmethod
-
 from pydantic import BaseModel, Field
 
 from llama_stack.apis.common.content_types import URL
-
 from llama_stack.apis.common.type_system import ParamType
 from llama_stack.apis.resource import Resource, ResourceType
 
@@ -44,8 +42,12 @@ class DatasetInput(CommonDatasetFields, BaseModel):
     provider_dataset_id: Optional[str] = None
 
 
+class ListDatasetsResponse(BaseModel):
+    data: List[Dataset]
+
+
 class Datasets(Protocol):
-    @webmethod(route="/datasets/register", method="POST")
+    @webmethod(route="/datasets", method="POST")
     async def register_dataset(
         self,
         dataset_id: str,
@@ -56,16 +58,16 @@ class Datasets(Protocol):
         metadata: Optional[Dict[str, Any]] = None,
     ) -> None: ...
 
-    @webmethod(route="/datasets/get", method="GET")
+    @webmethod(route="/datasets/{dataset_id}", method="GET")
     async def get_dataset(
         self,
         dataset_id: str,
     ) -> Optional[Dataset]: ...
 
-    @webmethod(route="/datasets/list", method="GET")
-    async def list_datasets(self) -> List[Dataset]: ...
+    @webmethod(route="/datasets", method="GET")
+    async def list_datasets(self) -> ListDatasetsResponse: ...
 
-    @webmethod(route="/datasets/unregister", method="POST")
+    @webmethod(route="/datasets/{dataset_id}", method="DELETE")
     async def unregister_dataset(
         self,
         dataset_id: str,
diff --git a/llama_stack/apis/eval/eval.py b/llama_stack/apis/eval/eval.py
index 1073d6310..1b8f768ad 100644
--- a/llama_stack/apis/eval/eval.py
+++ b/llama_stack/apis/eval/eval.py
@@ -7,9 +7,7 @@
 from typing import Any, Dict, List, Literal, Optional, Protocol, Union
 
 from llama_models.schema_utils import json_schema_type, webmethod
-
 from pydantic import BaseModel, Field
-
 from typing_extensions import Annotated
 
 from llama_stack.apis.agents import AgentConfig
@@ -76,7 +74,7 @@ class EvaluateResponse(BaseModel):
 
 
 class Eval(Protocol):
-    @webmethod(route="/eval/run-eval", method="POST")
+    @webmethod(route="/eval/run", method="POST")
     async def run_eval(
         self,
         task_id: str,
@@ -92,11 +90,11 @@ class Eval(Protocol):
         task_config: EvalTaskConfig,
     ) -> EvaluateResponse: ...
 
-    @webmethod(route="/eval/job/status", method="GET")
-    async def job_status(self, task_id: str, job_id: str) -> Optional[JobStatus]: ...
+    @webmethod(route="/eval/jobs/{job_id}", method="GET")
+    async def job_status(self, job_id: str, task_id: str) -> Optional[JobStatus]: ...
 
-    @webmethod(route="/eval/job/cancel", method="POST")
-    async def job_cancel(self, task_id: str, job_id: str) -> None: ...
+    @webmethod(route="/eval/jobs/cancel", method="POST")
+    async def job_cancel(self, job_id: str, task_id: str) -> None: ...
 
-    @webmethod(route="/eval/job/result", method="GET")
-    async def job_result(self, task_id: str, job_id: str) -> EvaluateResponse: ...
+    @webmethod(route="/eval/jobs/{job_id}/result", method="GET")
+    async def job_result(self, job_id: str, task_id: str) -> EvaluateResponse: ...
diff --git a/llama_stack/apis/eval_tasks/eval_tasks.py b/llama_stack/apis/eval_tasks/eval_tasks.py
index 083681289..a0a533055 100644
--- a/llama_stack/apis/eval_tasks/eval_tasks.py
+++ b/llama_stack/apis/eval_tasks/eval_tasks.py
@@ -6,7 +6,6 @@
 from typing import Any, Dict, List, Literal, Optional, Protocol, runtime_checkable
 
 from llama_models.schema_utils import json_schema_type, webmethod
-
 from pydantic import BaseModel, Field
 
 from llama_stack.apis.resource import Resource, ResourceType
@@ -40,15 +39,22 @@ class EvalTaskInput(CommonEvalTaskFields, BaseModel):
     provider_eval_task_id: Optional[str] = None
 
 
+class ListEvalTasksResponse(BaseModel):
+    data: List[EvalTask]
+
+
 @runtime_checkable
 class EvalTasks(Protocol):
-    @webmethod(route="/eval-tasks/list", method="GET")
-    async def list_eval_tasks(self) -> List[EvalTask]: ...
+    @webmethod(route="/eval-tasks", method="GET")
+    async def list_eval_tasks(self) -> ListEvalTasksResponse: ...
 
-    @webmethod(route="/eval-tasks/get", method="GET")
-    async def get_eval_task(self, name: str) -> Optional[EvalTask]: ...
+    @webmethod(route="/eval-tasks/{eval_task_id}", method="GET")
+    async def get_eval_task(
+        self,
+        eval_task_id: str,
+    ) -> Optional[EvalTask]: ...
 
-    @webmethod(route="/eval-tasks/register", method="POST")
+    @webmethod(route="/eval-tasks", method="POST")
     async def register_eval_task(
         self,
         eval_task_id: str,
diff --git a/llama_stack/apis/inference/inference.py b/llama_stack/apis/inference/inference.py
index b525aa331..fdda5fe1b 100644
--- a/llama_stack/apis/inference/inference.py
+++ b/llama_stack/apis/inference/inference.py
@@ -291,7 +291,7 @@ class ModelStore(Protocol):
 class Inference(Protocol):
     model_store: ModelStore
 
-    @webmethod(route="/inference/completion")
+    @webmethod(route="/inference/completion", method="POST")
     async def completion(
         self,
         model_id: str,
@@ -302,7 +302,7 @@ class Inference(Protocol):
         logprobs: Optional[LogProbConfig] = None,
     ) -> Union[CompletionResponse, AsyncIterator[CompletionResponseStreamChunk]]: ...
 
-    @webmethod(route="/inference/chat-completion")
+    @webmethod(route="/inference/chat-completion", method="POST")
     async def chat_completion(
         self,
         model_id: str,
@@ -319,7 +319,7 @@ class Inference(Protocol):
         ChatCompletionResponse, AsyncIterator[ChatCompletionResponseStreamChunk]
     ]: ...
 
-    @webmethod(route="/inference/embeddings")
+    @webmethod(route="/inference/embeddings", method="POST")
     async def embeddings(
         self,
         model_id: str,
diff --git a/llama_stack/apis/inspect/inspect.py b/llama_stack/apis/inspect/inspect.py
index 699bce7b7..e2bb98217 100644
--- a/llama_stack/apis/inspect/inspect.py
+++ b/llama_stack/apis/inspect/inspect.py
@@ -34,10 +34,14 @@ class VersionInfo(BaseModel):
     version: str
 
 
+class ListProvidersResponse(BaseModel):
+    data: List[ProviderInfo]
+
+
 @runtime_checkable
 class Inspect(Protocol):
     @webmethod(route="/providers/list", method="GET")
-    async def list_providers(self) -> Dict[str, ProviderInfo]: ...
+    async def list_providers(self) -> ListProvidersResponse: ...
 
     @webmethod(route="/routes/list", method="GET")
     async def list_routes(self) -> Dict[str, List[RouteInfo]]: ...
diff --git a/llama_stack/apis/memory/memory.py b/llama_stack/apis/memory/memory.py
index 8096a107a..6e6fcf697 100644
--- a/llama_stack/apis/memory/memory.py
+++ b/llama_stack/apis/memory/memory.py
@@ -50,7 +50,7 @@ class Memory(Protocol):
 
     # this will just block now until documents are inserted, but it should
     # probably return a Job instance which can be polled for completion
-    @webmethod(route="/memory/insert")
+    @webmethod(route="/memory/insert", method="POST")
     async def insert_documents(
         self,
         bank_id: str,
@@ -58,7 +58,7 @@ class Memory(Protocol):
         ttl_seconds: Optional[int] = None,
     ) -> None: ...
 
-    @webmethod(route="/memory/query")
+    @webmethod(route="/memory/query", method="POST")
     async def query_documents(
         self,
         bank_id: str,
diff --git a/llama_stack/apis/memory_banks/memory_banks.py b/llama_stack/apis/memory_banks/memory_banks.py
index 21569beff..ec8ba824b 100644
--- a/llama_stack/apis/memory_banks/memory_banks.py
+++ b/llama_stack/apis/memory_banks/memory_banks.py
@@ -16,7 +16,6 @@ from typing import (
 )
 
 from llama_models.schema_utils import json_schema_type, register_schema, webmethod
-
 from pydantic import BaseModel, Field
 
 from llama_stack.apis.resource import Resource, ResourceType
@@ -133,16 +132,23 @@ class MemoryBankInput(BaseModel):
     provider_memory_bank_id: Optional[str] = None
 
 
+class ListMemoryBanksResponse(BaseModel):
+    data: List[MemoryBank]
+
+
 @runtime_checkable
 @trace_protocol
 class MemoryBanks(Protocol):
-    @webmethod(route="/memory-banks/list", method="GET")
-    async def list_memory_banks(self) -> List[MemoryBank]: ...
+    @webmethod(route="/memory-banks", method="GET")
+    async def list_memory_banks(self) -> ListMemoryBanksResponse: ...
 
-    @webmethod(route="/memory-banks/get", method="GET")
-    async def get_memory_bank(self, memory_bank_id: str) -> Optional[MemoryBank]: ...
+    @webmethod(route="/memory-banks/{memory_bank_id}", method="GET")
+    async def get_memory_bank(
+        self,
+        memory_bank_id: str,
+    ) -> Optional[MemoryBank]: ...
 
-    @webmethod(route="/memory-banks/register", method="POST")
+    @webmethod(route="/memory-banks", method="POST")
     async def register_memory_bank(
         self,
         memory_bank_id: str,
@@ -151,5 +157,5 @@ class MemoryBanks(Protocol):
         provider_memory_bank_id: Optional[str] = None,
     ) -> MemoryBank: ...
 
-    @webmethod(route="/memory-banks/unregister", method="POST")
+    @webmethod(route="/memory-banks/{memory_bank_id}", method="DELETE")
     async def unregister_memory_bank(self, memory_bank_id: str) -> None: ...
diff --git a/llama_stack/apis/models/models.py b/llama_stack/apis/models/models.py
index 0ee23ecc1..3361c2836 100644
--- a/llama_stack/apis/models/models.py
+++ b/llama_stack/apis/models/models.py
@@ -52,16 +52,23 @@ class ModelInput(CommonModelFields):
     model_config = ConfigDict(protected_namespaces=())
 
 
+class ListModelsResponse(BaseModel):
+    data: List[Model]
+
+
 @runtime_checkable
 @trace_protocol
 class Models(Protocol):
-    @webmethod(route="/models/list", method="GET")
-    async def list_models(self) -> List[Model]: ...
+    @webmethod(route="/models", method="GET")
+    async def list_models(self) -> ListModelsResponse: ...
 
-    @webmethod(route="/models/get", method="GET")
-    async def get_model(self, identifier: str) -> Optional[Model]: ...
+    @webmethod(route="/models/{model_id}", method="GET")
+    async def get_model(
+        self,
+        model_id: str,
+    ) -> Optional[Model]: ...
 
-    @webmethod(route="/models/register", method="POST")
+    @webmethod(route="/models", method="POST")
     async def register_model(
         self,
         model_id: str,
@@ -71,5 +78,8 @@ class Models(Protocol):
         model_type: Optional[ModelType] = None,
     ) -> Model: ...
 
-    @webmethod(route="/models/unregister", method="POST")
-    async def unregister_model(self, model_id: str) -> None: ...
+    @webmethod(route="/models/{model_id}", method="DELETE")
+    async def unregister_model(
+        self,
+        model_id: str,
+    ) -> None: ...
diff --git a/llama_stack/apis/post_training/post_training.py b/llama_stack/apis/post_training/post_training.py
index 8841dc1d0..b9aa3bbde 100644
--- a/llama_stack/apis/post_training/post_training.py
+++ b/llama_stack/apis/post_training/post_training.py
@@ -6,16 +6,13 @@
 
 from datetime import datetime
 from enum import Enum
-
 from typing import Any, Dict, List, Literal, Optional, Protocol, Union
 
 from llama_models.schema_utils import json_schema_type, webmethod
-
 from pydantic import BaseModel, Field
 from typing_extensions import Annotated
 
 from llama_stack.apis.common.content_types import URL
-
 from llama_stack.apis.common.job_types import JobStatus
 from llama_stack.apis.common.training_types import Checkpoint
 
@@ -159,6 +156,10 @@ class PostTrainingJobStatusResponse(BaseModel):
     checkpoints: List[Checkpoint] = Field(default_factory=list)
 
 
+class ListPostTrainingJobsResponse(BaseModel):
+    data: List[PostTrainingJob]
+
+
 @json_schema_type
 class PostTrainingJobArtifactsResponse(BaseModel):
     """Artifacts of a finetuning job."""
@@ -197,7 +198,7 @@ class PostTraining(Protocol):
     ) -> PostTrainingJob: ...
 
     @webmethod(route="/post-training/jobs", method="GET")
-    async def get_training_jobs(self) -> List[PostTrainingJob]: ...
+    async def get_training_jobs(self) -> ListPostTrainingJobsResponse: ...
 
     @webmethod(route="/post-training/job/status", method="GET")
     async def get_training_job_status(
diff --git a/llama_stack/apis/safety/safety.py b/llama_stack/apis/safety/safety.py
index dd24642b1..513733d1e 100644
--- a/llama_stack/apis/safety/safety.py
+++ b/llama_stack/apis/safety/safety.py
@@ -12,7 +12,6 @@ from pydantic import BaseModel, Field
 
 from llama_stack.apis.inference import Message
 from llama_stack.apis.shields import Shield
-
 from llama_stack.providers.utils.telemetry.trace_protocol import trace_protocol
 
 
@@ -49,7 +48,7 @@ class ShieldStore(Protocol):
 class Safety(Protocol):
     shield_store: ShieldStore
 
-    @webmethod(route="/safety/run-shield")
+    @webmethod(route="/safety/run-shield", method="POST")
     async def run_shield(
         self,
         shield_id: str,
diff --git a/llama_stack/apis/scoring/scoring.py b/llama_stack/apis/scoring/scoring.py
index 996291dcc..5bacaaf66 100644
--- a/llama_stack/apis/scoring/scoring.py
+++ b/llama_stack/apis/scoring/scoring.py
@@ -11,7 +11,6 @@ from pydantic import BaseModel
 
 from llama_stack.apis.scoring_functions import ScoringFn, ScoringFnParams
 
-
 # mapping of metric to value
 ScoringResultRow = Dict[str, Any]
 
@@ -43,7 +42,7 @@ class ScoringFunctionStore(Protocol):
 class Scoring(Protocol):
     scoring_function_store: ScoringFunctionStore
 
-    @webmethod(route="/scoring/score-batch")
+    @webmethod(route="/scoring/score-batch", method="POST")
     async def score_batch(
         self,
         dataset_id: str,
@@ -51,7 +50,7 @@ class Scoring(Protocol):
         save_results_dataset: bool = False,
     ) -> ScoreBatchResponse: ...
 
-    @webmethod(route="/scoring/score")
+    @webmethod(route="/scoring/score", method="POST")
     async def score(
         self,
         input_rows: List[Dict[str, Any]],
diff --git a/llama_stack/apis/scoring_functions/scoring_functions.py b/llama_stack/apis/scoring_functions/scoring_functions.py
index fc57cfbbf..3089dc0a4 100644
--- a/llama_stack/apis/scoring_functions/scoring_functions.py
+++ b/llama_stack/apis/scoring_functions/scoring_functions.py
@@ -21,7 +21,6 @@ from pydantic import BaseModel, Field
 from typing_extensions import Annotated
 
 from llama_stack.apis.common.type_system import ParamType
-
 from llama_stack.apis.resource import Resource, ResourceType
 
 
@@ -129,15 +128,21 @@ class ScoringFnInput(CommonScoringFnFields, BaseModel):
     provider_scoring_fn_id: Optional[str] = None
 
 
+class ListScoringFunctionsResponse(BaseModel):
+    data: List[ScoringFn]
+
+
 @runtime_checkable
 class ScoringFunctions(Protocol):
-    @webmethod(route="/scoring-functions/list", method="GET")
-    async def list_scoring_functions(self) -> List[ScoringFn]: ...
+    @webmethod(route="/scoring-functions", method="GET")
+    async def list_scoring_functions(self) -> ListScoringFunctionsResponse: ...
 
-    @webmethod(route="/scoring-functions/get", method="GET")
-    async def get_scoring_function(self, scoring_fn_id: str) -> Optional[ScoringFn]: ...
+    @webmethod(route="/scoring-functions/{scoring_fn_id}", method="GET")
+    async def get_scoring_function(
+        self, scoring_fn_id: str, /
+    ) -> Optional[ScoringFn]: ...
 
-    @webmethod(route="/scoring-functions/register", method="POST")
+    @webmethod(route="/scoring-functions", method="POST")
     async def register_scoring_function(
         self,
         scoring_fn_id: str,
diff --git a/llama_stack/apis/shields/shields.py b/llama_stack/apis/shields/shields.py
index 8d4d5f9fd..3dd685b14 100644
--- a/llama_stack/apis/shields/shields.py
+++ b/llama_stack/apis/shields/shields.py
@@ -38,16 +38,20 @@ class ShieldInput(CommonShieldFields):
     provider_shield_id: Optional[str] = None
 
 
+class ListShieldsResponse(BaseModel):
+    data: List[Shield]
+
+
 @runtime_checkable
 @trace_protocol
 class Shields(Protocol):
-    @webmethod(route="/shields/list", method="GET")
-    async def list_shields(self) -> List[Shield]: ...
+    @webmethod(route="/shields", method="GET")
+    async def list_shields(self) -> ListShieldsResponse: ...
 
-    @webmethod(route="/shields/get", method="GET")
+    @webmethod(route="/shields/{identifier}", method="GET")
     async def get_shield(self, identifier: str) -> Optional[Shield]: ...
 
-    @webmethod(route="/shields/register", method="POST")
+    @webmethod(route="/shields", method="POST")
     async def register_shield(
         self,
         shield_id: str,
diff --git a/llama_stack/apis/telemetry/telemetry.py b/llama_stack/apis/telemetry/telemetry.py
index 23a475bff..d04cb67e3 100644
--- a/llama_stack/apis/telemetry/telemetry.py
+++ b/llama_stack/apis/telemetry/telemetry.py
@@ -185,8 +185,8 @@ class Telemetry(Protocol):
         order_by: Optional[List[str]] = None,
     ) -> List[Trace]: ...
 
-    @webmethod(route="/telemetry/get-span-tree", method="POST")
-    async def get_span_tree(
+    @webmethod(route="/telemetry/query-span-tree", method="POST")
+    async def query_span_tree(
         self,
         span_id: str,
         attributes_to_return: Optional[List[str]] = None,
diff --git a/llama_stack/apis/tools/tools.py b/llama_stack/apis/tools/tools.py
index d2bdf9873..fb990cc41 100644
--- a/llama_stack/apis/tools/tools.py
+++ b/llama_stack/apis/tools/tools.py
@@ -74,13 +74,21 @@ class ToolInvocationResult(BaseModel):
 
 class ToolStore(Protocol):
     def get_tool(self, tool_name: str) -> Tool: ...
-    def get_tool_group(self, tool_group_id: str) -> ToolGroup: ...
+    def get_tool_group(self, toolgroup_id: str) -> ToolGroup: ...
+
+
+class ListToolGroupsResponse(BaseModel):
+    data: List[ToolGroup]
+
+
+class ListToolsResponse(BaseModel):
+    data: List[Tool]
 
 
 @runtime_checkable
 @trace_protocol
 class ToolGroups(Protocol):
-    @webmethod(route="/toolgroups/register", method="POST")
+    @webmethod(route="/toolgroups", method="POST")
     async def register_tool_group(
         self,
         toolgroup_id: str,
@@ -91,27 +99,33 @@ class ToolGroups(Protocol):
         """Register a tool group"""
         ...
 
-    @webmethod(route="/toolgroups/get", method="GET")
+    @webmethod(route="/toolgroups/{toolgroup_id}", method="GET")
     async def get_tool_group(
         self,
         toolgroup_id: str,
     ) -> ToolGroup: ...
 
-    @webmethod(route="/toolgroups/list", method="GET")
-    async def list_tool_groups(self) -> List[ToolGroup]:
+    @webmethod(route="/toolgroups", method="GET")
+    async def list_tool_groups(self) -> ListToolGroupsResponse:
         """List tool groups with optional provider"""
         ...
 
-    @webmethod(route="/tools/list", method="GET")
-    async def list_tools(self, tool_group_id: Optional[str] = None) -> List[Tool]:
+    @webmethod(route="/tools", method="GET")
+    async def list_tools(self, toolgroup_id: Optional[str] = None) -> ListToolsResponse:
         """List tools with optional tool group"""
         ...
 
-    @webmethod(route="/tools/get", method="GET")
-    async def get_tool(self, tool_name: str) -> Tool: ...
+    @webmethod(route="/tools/{tool_name}", method="GET")
+    async def get_tool(
+        self,
+        tool_name: str,
+    ) -> Tool: ...
 
-    @webmethod(route="/toolgroups/unregister", method="POST")
-    async def unregister_tool_group(self, tool_group_id: str) -> None:
+    @webmethod(route="/toolgroups/{toolgroup_id}", method="DELETE")
+    async def unregister_toolgroup(
+        self,
+        toolgroup_id: str,
+    ) -> None:
         """Unregister a tool group"""
         ...
 
diff --git a/llama_stack/distribution/routers/routing_tables.py b/llama_stack/distribution/routers/routing_tables.py
index a3a64bf6b..e02606936 100644
--- a/llama_stack/distribution/routers/routing_tables.py
+++ b/llama_stack/distribution/routers/routing_tables.py
@@ -10,23 +10,32 @@ from pydantic import TypeAdapter
 
 from llama_stack.apis.common.content_types import URL
 from llama_stack.apis.common.type_system import ParamType
-from llama_stack.apis.datasets import Dataset, Datasets
-from llama_stack.apis.eval_tasks import EvalTask, EvalTasks
+from llama_stack.apis.datasets import Dataset, Datasets, ListDatasetsResponse
+from llama_stack.apis.eval_tasks import EvalTask, EvalTasks, ListEvalTasksResponse
 from llama_stack.apis.memory_banks import (
     BankParams,
+    ListMemoryBanksResponse,
     MemoryBank,
     MemoryBanks,
     MemoryBankType,
 )
-from llama_stack.apis.models import Model, Models, ModelType
+from llama_stack.apis.models import ListModelsResponse, Model, Models, ModelType
 from llama_stack.apis.resource import ResourceType
 from llama_stack.apis.scoring_functions import (
+    ListScoringFunctionsResponse,
     ScoringFn,
     ScoringFnParams,
     ScoringFunctions,
 )
-from llama_stack.apis.shields import Shield, Shields
-from llama_stack.apis.tools import Tool, ToolGroup, ToolGroups, ToolHost
+from llama_stack.apis.shields import ListShieldsResponse, Shield, Shields
+from llama_stack.apis.tools import (
+    ListToolGroupsResponse,
+    ListToolsResponse,
+    Tool,
+    ToolGroup,
+    ToolGroups,
+    ToolHost,
+)
 from llama_stack.distribution.datatypes import (
     RoutableObject,
     RoutableObjectWithProvider,
@@ -215,11 +224,11 @@ class CommonRoutingTableImpl(RoutingTable):
 
 
 class ModelsRoutingTable(CommonRoutingTableImpl, Models):
-    async def list_models(self) -> List[Model]:
-        return await self.get_all_with_type("model")
+    async def list_models(self) -> ListModelsResponse:
+        return ListModelsResponse(data=await self.get_all_with_type("model"))
 
-    async def get_model(self, identifier: str) -> Optional[Model]:
-        return await self.get_object_by_identifier("model", identifier)
+    async def get_model(self, model_id: str) -> Optional[Model]:
+        return await self.get_object_by_identifier("model", model_id)
 
     async def register_model(
         self,
@@ -265,8 +274,10 @@ class ModelsRoutingTable(CommonRoutingTableImpl, Models):
 
 
 class ShieldsRoutingTable(CommonRoutingTableImpl, Shields):
-    async def list_shields(self) -> List[Shield]:
-        return await self.get_all_with_type(ResourceType.shield.value)
+    async def list_shields(self) -> ListShieldsResponse:
+        return ListShieldsResponse(
+            data=await self.get_all_with_type(ResourceType.shield.value)
+        )
 
     async def get_shield(self, identifier: str) -> Optional[Shield]:
         return await self.get_object_by_identifier("shield", identifier)
@@ -301,8 +312,8 @@ class ShieldsRoutingTable(CommonRoutingTableImpl, Shields):
 
 
 class MemoryBanksRoutingTable(CommonRoutingTableImpl, MemoryBanks):
-    async def list_memory_banks(self) -> List[MemoryBank]:
-        return await self.get_all_with_type(ResourceType.memory_bank.value)
+    async def list_memory_banks(self) -> ListMemoryBanksResponse:
+        return ListMemoryBanksResponse(data=await self.get_all_with_type("memory_bank"))
 
     async def get_memory_bank(self, memory_bank_id: str) -> Optional[MemoryBank]:
         return await self.get_object_by_identifier("memory_bank", memory_bank_id)
@@ -365,8 +376,10 @@ class MemoryBanksRoutingTable(CommonRoutingTableImpl, MemoryBanks):
 
 
 class DatasetsRoutingTable(CommonRoutingTableImpl, Datasets):
-    async def list_datasets(self) -> List[Dataset]:
-        return await self.get_all_with_type(ResourceType.dataset.value)
+    async def list_datasets(self) -> ListDatasetsResponse:
+        return ListDatasetsResponse(
+            data=await self.get_all_with_type(ResourceType.dataset.value)
+        )
 
     async def get_dataset(self, dataset_id: str) -> Optional[Dataset]:
         return await self.get_object_by_identifier("dataset", dataset_id)
@@ -410,8 +423,10 @@ class DatasetsRoutingTable(CommonRoutingTableImpl, Datasets):
 
 
 class ScoringFunctionsRoutingTable(CommonRoutingTableImpl, ScoringFunctions):
-    async def list_scoring_functions(self) -> List[ScoringFn]:
-        return await self.get_all_with_type(ResourceType.scoring_function.value)
+    async def list_scoring_functions(self) -> ListScoringFunctionsResponse:
+        return ListScoringFunctionsResponse(
+            data=await self.get_all_with_type(ResourceType.scoring_function.value)
+        )
 
     async def get_scoring_function(self, scoring_fn_id: str) -> Optional[ScoringFn]:
         return await self.get_object_by_identifier("scoring_function", scoring_fn_id)
@@ -447,11 +462,11 @@ class ScoringFunctionsRoutingTable(CommonRoutingTableImpl, ScoringFunctions):
 
 
 class EvalTasksRoutingTable(CommonRoutingTableImpl, EvalTasks):
-    async def list_eval_tasks(self) -> List[EvalTask]:
-        return await self.get_all_with_type(ResourceType.eval_task.value)
+    async def list_eval_tasks(self) -> ListEvalTasksResponse:
+        return ListEvalTasksResponse(data=await self.get_all_with_type("eval_task"))
 
-    async def get_eval_task(self, name: str) -> Optional[EvalTask]:
-        return await self.get_object_by_identifier("eval_task", name)
+    async def get_eval_task(self, eval_task_id: str) -> Optional[EvalTask]:
+        return await self.get_object_by_identifier("eval_task", eval_task_id)
 
     async def register_eval_task(
         self,
@@ -485,14 +500,14 @@ class EvalTasksRoutingTable(CommonRoutingTableImpl, EvalTasks):
 
 
 class ToolGroupsRoutingTable(CommonRoutingTableImpl, ToolGroups):
-    async def list_tools(self, tool_group_id: Optional[str] = None) -> List[Tool]:
+    async def list_tools(self, toolgroup_id: Optional[str] = None) -> ListToolsResponse:
         tools = await self.get_all_with_type("tool")
-        if tool_group_id:
-            tools = [tool for tool in tools if tool.toolgroup_id == tool_group_id]
-        return tools
+        if toolgroup_id:
+            tools = [tool for tool in tools if tool.toolgroup_id == toolgroup_id]
+        return ListToolsResponse(data=tools)
 
-    async def list_tool_groups(self) -> List[ToolGroup]:
-        return await self.get_all_with_type("tool_group")
+    async def list_tool_groups(self) -> ListToolGroupsResponse:
+        return ListToolGroupsResponse(data=await self.get_all_with_type("tool_group"))
 
     async def get_tool_group(self, toolgroup_id: str) -> ToolGroup:
         return await self.get_object_by_identifier("tool_group", toolgroup_id)
@@ -551,11 +566,11 @@ class ToolGroupsRoutingTable(CommonRoutingTableImpl, ToolGroups):
             )
         )
 
-    async def unregister_tool_group(self, tool_group_id: str) -> None:
-        tool_group = await self.get_tool_group(tool_group_id)
+    async def unregister_toolgroup(self, toolgroup_id: str) -> None:
+        tool_group = await self.get_tool_group(toolgroup_id)
         if tool_group is None:
-            raise ValueError(f"Tool group {tool_group_id} not found")
-        tools = await self.list_tools(tool_group_id)
+            raise ValueError(f"Tool group {toolgroup_id} not found")
+        tools = await self.list_tools(toolgroup_id).data
         for tool in tools:
             await self.unregister_object(tool)
         await self.unregister_object(tool_group)
diff --git a/llama_stack/distribution/server/server.py b/llama_stack/distribution/server/server.py
index 34334de77..2d216d314 100644
--- a/llama_stack/distribution/server/server.py
+++ b/llama_stack/distribution/server/server.py
@@ -14,16 +14,13 @@ import signal
 import sys
 import traceback
 import warnings
-
 from contextlib import asynccontextmanager
-
 from importlib.metadata import version as parse_version
 from pathlib import Path
-from typing import Any, Union
+from typing import Any, List, Union
 
 import yaml
-
-from fastapi import Body, FastAPI, HTTPException, Request
+from fastapi import Body, FastAPI, HTTPException, Path as FastapiPath, Request
 from fastapi.exceptions import RequestValidationError
 from fastapi.responses import JSONResponse, StreamingResponse
 from pydantic import BaseModel, ValidationError
@@ -31,7 +28,6 @@ from termcolor import cprint
 from typing_extensions import Annotated
 
 from llama_stack.distribution.datatypes import StackRunConfig
-
 from llama_stack.distribution.distribution import builtin_automatically_routed_apis
 from llama_stack.distribution.request_headers import set_request_provider_data
 from llama_stack.distribution.resolver import InvalidProviderError
@@ -41,13 +37,11 @@ from llama_stack.distribution.stack import (
     replace_env_vars,
     validate_env_pair,
 )
-
 from llama_stack.providers.datatypes import Api
 from llama_stack.providers.inline.telemetry.meta_reference.config import TelemetryConfig
 from llama_stack.providers.inline.telemetry.meta_reference.telemetry import (
     TelemetryAdapter,
 )
-
 from llama_stack.providers.utils.telemetry.tracing import (
     end_trace,
     setup_logger,
@@ -56,7 +50,6 @@ from llama_stack.providers.utils.telemetry.tracing import (
 
 from .endpoints import get_all_api_endpoints
 
-
 REPO_ROOT = Path(__file__).parent.parent.parent.parent
 
 
@@ -178,7 +171,7 @@ async def sse_generator(event_gen):
         )
 
 
-def create_dynamic_typed_route(func: Any, method: str):
+def create_dynamic_typed_route(func: Any, method: str, route: str):
     async def endpoint(request: Request, **kwargs):
         set_request_provider_data(request.headers)
 
@@ -196,6 +189,7 @@ def create_dynamic_typed_route(func: Any, method: str):
             raise translate_exception(e) from e
 
     sig = inspect.signature(func)
+
     new_params = [
         inspect.Parameter(
             "request", inspect.Parameter.POSITIONAL_OR_KEYWORD, annotation=Request
@@ -203,12 +197,21 @@ def create_dynamic_typed_route(func: Any, method: str):
     ]
     new_params.extend(sig.parameters.values())
 
+    path_params = extract_path_params(route)
     if method == "post":
-        # make sure every parameter is annotated with Body() so FASTAPI doesn't
-        # do anything too intelligent and ask for some parameters in the query
-        # and some in the body
+        # Annotate parameters that are in the path with Path(...) and others with Body(...)
         new_params = [new_params[0]] + [
-            param.replace(annotation=Annotated[param.annotation, Body(..., embed=True)])
+            (
+                param.replace(
+                    annotation=Annotated[
+                        param.annotation, FastapiPath(..., title=param.name)
+                    ]
+                )
+                if param.name in path_params
+                else param.replace(
+                    annotation=Annotated[param.annotation, Body(..., embed=True)]
+                )
+            )
             for param in new_params[1:]
         ]
 
@@ -386,6 +389,7 @@ def main():
                     create_dynamic_typed_route(
                         impl_method,
                         endpoint.method,
+                        endpoint.route,
                     )
                 )
 
@@ -409,5 +413,13 @@ def main():
     uvicorn.run(app, host=listen_host, port=args.port)
 
 
+def extract_path_params(route: str) -> List[str]:
+    segments = route.split("/")
+    params = [
+        seg[1:-1] for seg in segments if seg.startswith("{") and seg.endswith("}")
+    ]
+    return params
+
+
 if __name__ == "__main__":
     main()
diff --git a/llama_stack/distribution/stack.py b/llama_stack/distribution/stack.py
index e3edf1e16..ad7bcd234 100644
--- a/llama_stack/distribution/stack.py
+++ b/llama_stack/distribution/stack.py
@@ -93,7 +93,11 @@ async def register_resources(run_config: StackRunConfig, impls: Dict[Api, Any]):
             await method(**obj.model_dump())
 
         method = getattr(impls[api], list_method)
-        for obj in await method():
+        response = await method()
+
+        objects_to_process = response.data if hasattr(response, "data") else response
+
+        for obj in objects_to_process:
             log.info(
                 f"{rsrc.capitalize()}: {colored(obj.identifier, 'white', attrs=['bold'])} served by {colored(obj.provider_id, 'white', attrs=['bold'])}",
             )
diff --git a/llama_stack/providers/inline/agents/meta_reference/agent_instance.py b/llama_stack/providers/inline/agents/meta_reference/agent_instance.py
index 2299e80d1..2ebc7ded1 100644
--- a/llama_stack/providers/inline/agents/meta_reference/agent_instance.py
+++ b/llama_stack/providers/inline/agents/meta_reference/agent_instance.py
@@ -624,6 +624,10 @@ class ChatAgent(ShieldRunnerMixin):
                             step_type=StepType.tool_execution.value,
                             step_id=step_id,
                             tool_call=tool_call,
+                            delta=ToolCallDelta(
+                                parse_status=ToolCallParseStatus.in_progress,
+                                content=tool_call,
+                            ),
                         )
                     )
                 )
@@ -735,8 +739,8 @@ class ChatAgent(ShieldRunnerMixin):
         for toolgroup_name in agent_config_toolgroups:
             if toolgroup_name not in toolgroups_for_turn_set:
                 continue
-            tools = await self.tool_groups_api.list_tools(tool_group_id=toolgroup_name)
-            for tool_def in tools:
+            tools = await self.tool_groups_api.list_tools(toolgroup_id=toolgroup_name)
+            for tool_def in tools.data:
                 if (
                     toolgroup_name.startswith("builtin")
                     and toolgroup_name != MEMORY_GROUP
diff --git a/llama_stack/providers/inline/agents/meta_reference/agents.py b/llama_stack/providers/inline/agents/meta_reference/agents.py
index faff716ce..d22ef82ab 100644
--- a/llama_stack/providers/inline/agents/meta_reference/agents.py
+++ b/llama_stack/providers/inline/agents/meta_reference/agents.py
@@ -223,5 +223,5 @@ class MetaReferenceAgentsImpl(Agents):
     async def delete_agents_session(self, agent_id: str, session_id: str) -> None:
         await self.persistence_store.delete(f"session:{agent_id}:{session_id}")
 
-    async def delete_agents(self, agent_id: str) -> None:
+    async def delete_agent(self, agent_id: str) -> None:
         await self.persistence_store.delete(f"agent:{agent_id}")
diff --git a/llama_stack/providers/inline/post_training/torchtune/post_training.py b/llama_stack/providers/inline/post_training/torchtune/post_training.py
index 90fbf7026..4abe13de2 100644
--- a/llama_stack/providers/inline/post_training/torchtune/post_training.py
+++ b/llama_stack/providers/inline/post_training/torchtune/post_training.py
@@ -4,7 +4,7 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 from datetime import datetime
-from typing import Any, Dict, List, Optional
+from typing import Any, Dict, Optional
 
 from llama_models.schema_utils import webmethod
 
@@ -14,6 +14,7 @@ from llama_stack.apis.post_training import (
     AlgorithmConfig,
     DPOAlignmentConfig,
     JobStatus,
+    ListPostTrainingJobsResponse,
     LoraFinetuningConfig,
     PostTrainingJob,
     PostTrainingJobArtifactsResponse,
@@ -114,8 +115,8 @@ class TorchtunePostTrainingImpl:
         logger_config: Dict[str, Any],
     ) -> PostTrainingJob: ...
 
-    async def get_training_jobs(self) -> List[PostTrainingJob]:
-        return self.jobs_list
+    async def get_training_jobs(self) -> ListPostTrainingJobsResponse:
+        return ListPostTrainingJobsResponse(data=self.jobs_list)
 
     @webmethod(route="/post-training/job/status")
     async def get_training_job_status(
diff --git a/llama_stack/providers/inline/telemetry/meta_reference/telemetry.py b/llama_stack/providers/inline/telemetry/meta_reference/telemetry.py
index 332a150cf..e2e318375 100644
--- a/llama_stack/providers/inline/telemetry/meta_reference/telemetry.py
+++ b/llama_stack/providers/inline/telemetry/meta_reference/telemetry.py
@@ -249,7 +249,7 @@ class TelemetryAdapter(TelemetryDatasetMixin, Telemetry):
             order_by=order_by,
         )
 
-    async def get_span_tree(
+    async def query_span_tree(
         self,
         span_id: str,
         attributes_to_return: Optional[List[str]] = None,
diff --git a/tests/client-sdk/agents/test_agents.py b/tests/client-sdk/agents/test_agents.py
index 19a4064a0..747b64dd1 100644
--- a/tests/client-sdk/agents/test_agents.py
+++ b/tests/client-sdk/agents/test_agents.py
@@ -83,13 +83,13 @@ class TestClientTool(ClientTool):
 def agent_config(llama_stack_client):
     available_models = [
         model.identifier
-        for model in llama_stack_client.models.list()
+        for model in llama_stack_client.models.list().data
         if model.identifier.startswith("meta-llama") and "405" not in model.identifier
     ]
     model_id = available_models[0]
     print(f"Using model: {model_id}")
     available_shields = [
-        shield.identifier for shield in llama_stack_client.shields.list()
+        shield.identifier for shield in llama_stack_client.shields.list().data
     ]
     available_shields = available_shields[:1]
     print(f"Using shield: {available_shields}")