mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-24 00:47:00 +00:00
5553 lines
225 KiB
HTML
5553 lines
225 KiB
HTML
<!DOCTYPE html>
|
|
<html>
|
|
|
|
<head>
|
|
<meta charset="utf-8" />
|
|
<meta name="viewport" content="width=device-width, initial-scale=1">
|
|
<title>OpenAPI specification</title>
|
|
<link href="https://fonts.googleapis.com/css?family=Montserrat:300,400,700|Roboto:300,400,700" rel="stylesheet">
|
|
<script type="module" src="https://cdn.jsdelivr.net/npm/@stoplight/elements/web-components.min.js"></script>
|
|
<link rel="stylesheet" href="https://cdn.jsdelivr.net/npm/@stoplight/elements/styles.min.css">
|
|
<style>
|
|
body {
|
|
margin: 0;
|
|
padding: 0;
|
|
height: 100vh;
|
|
}
|
|
|
|
elements-api {
|
|
height: 100%;
|
|
}
|
|
</style>
|
|
</head>
|
|
|
|
<body>
|
|
<elements-api id="openapi-container" router="hash" layout="sidebar" hideExport="true"
|
|
hideInternal="true"></elements-api>
|
|
|
|
<script>
|
|
document.addEventListener("DOMContentLoaded", function () {
|
|
const spec = {
|
|
"openapi": "3.1.0",
|
|
"info": {
|
|
"title": "Llama Stack Specification - Experimental APIs",
|
|
"version": "v1",
|
|
"description": "This is the specification of the Llama Stack that provides\n a set of endpoints and their corresponding interfaces that are tailored to\n best leverage Llama Models.\n\n**🧪 EXPERIMENTAL**: Pre-release APIs (v1alpha, v1beta) that may change before becoming stable."
|
|
},
|
|
"servers": [
|
|
{
|
|
"url": "http://any-hosted-llama-stack.com"
|
|
}
|
|
],
|
|
"paths": {
|
|
"/v1beta/datasetio/append-rows/{dataset_id}": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"DatasetIO"
|
|
],
|
|
"summary": "Append rows to a dataset.",
|
|
"description": "Append rows to a dataset.",
|
|
"parameters": [
|
|
{
|
|
"name": "dataset_id",
|
|
"in": "path",
|
|
"description": "The ID of the dataset to append the rows to.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AppendRowsRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1beta/datasetio/iterrows/{dataset_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PaginatedResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PaginatedResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"DatasetIO"
|
|
],
|
|
"summary": "Get a paginated list of rows from a dataset.",
|
|
"description": "Get a paginated list of rows from a dataset.\nUses offset-based pagination where:\n- start_index: The starting index (0-based). If None, starts from beginning.\n- limit: Number of items to return. If None or -1, returns all items.\n\nThe response includes:\n- data: List of items for the current page.\n- has_more: Whether there are more items available after this set.",
|
|
"parameters": [
|
|
{
|
|
"name": "dataset_id",
|
|
"in": "path",
|
|
"description": "The ID of the dataset to get the rows from.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "start_index",
|
|
"in": "query",
|
|
"description": "Index into dataset for the first row to get. Get all rows if None.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
},
|
|
{
|
|
"name": "limit",
|
|
"in": "query",
|
|
"description": "The number of rows to get.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1beta/datasets": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A ListDatasetsResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/ListDatasetsResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Datasets"
|
|
],
|
|
"summary": "List all datasets.",
|
|
"description": "List all datasets.",
|
|
"parameters": [],
|
|
"deprecated": false
|
|
},
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Dataset.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Dataset"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Datasets"
|
|
],
|
|
"summary": "Register a new dataset.",
|
|
"description": "Register a new dataset.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/RegisterDatasetRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1beta/datasets/{dataset_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Dataset.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Dataset"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Datasets"
|
|
],
|
|
"summary": "Get a dataset by its ID.",
|
|
"description": "Get a dataset by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "dataset_id",
|
|
"in": "path",
|
|
"description": "The ID of the dataset to get.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"delete": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Datasets"
|
|
],
|
|
"summary": "Unregister a dataset by its ID.",
|
|
"description": "Unregister a dataset by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "dataset_id",
|
|
"in": "path",
|
|
"description": "The ID of the dataset to unregister.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PaginatedResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PaginatedResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "List all agents.",
|
|
"description": "List all agents.",
|
|
"parameters": [
|
|
{
|
|
"name": "start_index",
|
|
"in": "query",
|
|
"description": "The index to start the pagination from.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
},
|
|
{
|
|
"name": "limit",
|
|
"in": "query",
|
|
"description": "The number of agents to return.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "An AgentCreateResponse with the agent ID.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AgentCreateResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Create an agent with the given configuration.",
|
|
"description": "Create an agent with the given configuration.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/CreateAgentRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "An Agent of the agent.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Agent"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Describe an agent by its ID.",
|
|
"description": "Describe an agent by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "ID of the agent.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"delete": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Delete an agent by its ID and its associated sessions and turns.",
|
|
"description": "Delete an agent by its ID and its associated sessions and turns.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to delete.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "An AgentSessionCreateResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AgentSessionCreateResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Create a new session for an agent.",
|
|
"description": "Create a new session for an agent.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to create the session for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/CreateAgentSessionRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session/{session_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Session.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Session"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Retrieve an agent session by its ID.",
|
|
"description": "Retrieve an agent session by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to get.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to get the session for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "turn_ids",
|
|
"in": "query",
|
|
"description": "(Optional) List of turn IDs to filter the session by.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"delete": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Delete an agent session by its ID and its associated turns.",
|
|
"description": "Delete an agent session by its ID and its associated turns.",
|
|
"parameters": [
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to delete.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to delete the session for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session/{session_id}/turn": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "If stream=False, returns a Turn object. If stream=True, returns an SSE event stream of AgentTurnResponseStreamChunk.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Turn"
|
|
}
|
|
},
|
|
"text/event-stream": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AgentTurnResponseStreamChunk"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Create a new turn for an agent.",
|
|
"description": "Create a new turn for an agent.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to create the turn for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to create the turn for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/CreateAgentTurnRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session/{session_id}/turn/{turn_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Turn.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Turn"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Retrieve an agent turn by its ID.",
|
|
"description": "Retrieve an agent turn by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to get the turn for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to get the turn for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "turn_id",
|
|
"in": "path",
|
|
"description": "The ID of the turn to get.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session/{session_id}/turn/{turn_id}/resume": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Turn object if stream is False, otherwise an AsyncIterator of AgentTurnResponseStreamChunk objects.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Turn"
|
|
}
|
|
},
|
|
"text/event-stream": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AgentTurnResponseStreamChunk"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Resume an agent turn with executed tool call responses.",
|
|
"description": "Resume an agent turn with executed tool call responses.\nWhen a Turn has the status `awaiting_input` due to pending input from client side tool calls, this endpoint can be used to submit the outputs from the tool calls once they are ready.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to resume.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to resume.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "turn_id",
|
|
"in": "path",
|
|
"description": "The ID of the turn to resume.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/ResumeAgentTurnRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/session/{session_id}/turn/{turn_id}/step/{step_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "An AgentStepResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/AgentStepResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "Retrieve an agent step by its ID.",
|
|
"description": "Retrieve an agent step by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to get the step for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "session_id",
|
|
"in": "path",
|
|
"description": "The ID of the session to get the step for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "turn_id",
|
|
"in": "path",
|
|
"description": "The ID of the turn to get the step for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "step_id",
|
|
"in": "path",
|
|
"description": "The ID of the step to get.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/agents/{agent_id}/sessions": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PaginatedResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PaginatedResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Agents"
|
|
],
|
|
"summary": "List all session(s) of a given agent.",
|
|
"description": "List all session(s) of a given agent.",
|
|
"parameters": [
|
|
{
|
|
"name": "agent_id",
|
|
"in": "path",
|
|
"description": "The ID of the agent to list sessions for.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "start_index",
|
|
"in": "query",
|
|
"description": "The index to start the pagination from.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
},
|
|
{
|
|
"name": "limit",
|
|
"in": "query",
|
|
"description": "The number of sessions to return.",
|
|
"required": false,
|
|
"schema": {
|
|
"type": "integer"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A ListBenchmarksResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/ListBenchmarksResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Benchmarks"
|
|
],
|
|
"summary": "List all benchmarks.",
|
|
"description": "List all benchmarks.",
|
|
"parameters": [],
|
|
"deprecated": false
|
|
},
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Benchmarks"
|
|
],
|
|
"summary": "Register a benchmark.",
|
|
"description": "Register a benchmark.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/RegisterBenchmarkRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks/{benchmark_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A Benchmark.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Benchmark"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Benchmarks"
|
|
],
|
|
"summary": "Get a benchmark by its ID.",
|
|
"description": "Get a benchmark by its ID.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to get.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"delete": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Benchmarks"
|
|
],
|
|
"summary": "Unregister a benchmark.",
|
|
"description": "Unregister a benchmark.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to unregister.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks/{benchmark_id}/evaluations": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "EvaluateResponse object containing generations and scores.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/EvaluateResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Eval"
|
|
],
|
|
"summary": "Evaluate a list of rows on a benchmark.",
|
|
"description": "Evaluate a list of rows on a benchmark.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to run the evaluation on.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/EvaluateRowsRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks/{benchmark_id}/jobs": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "The job that was created to run the evaluation.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Job"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Eval"
|
|
],
|
|
"summary": "Run an evaluation on a benchmark.",
|
|
"description": "Run an evaluation on a benchmark.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to run the evaluation on.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/RunEvalRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks/{benchmark_id}/jobs/{job_id}": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "The status of the evaluation job.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Job"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Eval"
|
|
],
|
|
"summary": "Get the status of a job.",
|
|
"description": "Get the status of a job.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to run the evaluation on.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "job_id",
|
|
"in": "path",
|
|
"description": "The ID of the job to get the status of.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
},
|
|
"delete": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Eval"
|
|
],
|
|
"summary": "Cancel a job.",
|
|
"description": "Cancel a job.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to run the evaluation on.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "job_id",
|
|
"in": "path",
|
|
"description": "The ID of the job to cancel.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/eval/benchmarks/{benchmark_id}/jobs/{job_id}/result": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "The result of the job.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/EvaluateResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Eval"
|
|
],
|
|
"summary": "Get the result of a job.",
|
|
"description": "Get the result of a job.",
|
|
"parameters": [
|
|
{
|
|
"name": "benchmark_id",
|
|
"in": "path",
|
|
"description": "The ID of the benchmark to run the evaluation on.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
{
|
|
"name": "job_id",
|
|
"in": "path",
|
|
"description": "The ID of the job to get the result of.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/inference/rerank": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "RerankResponse with indices sorted by relevance score (descending).",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/RerankResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"Inference"
|
|
],
|
|
"summary": "Rerank a list of documents based on their relevance to a query.",
|
|
"description": "Rerank a list of documents based on their relevance to a query.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/RerankRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/job/artifacts": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PostTrainingJobArtifactsResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PostTrainingJobArtifactsResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Get the artifacts of a training job.",
|
|
"description": "Get the artifacts of a training job.",
|
|
"parameters": [
|
|
{
|
|
"name": "job_uuid",
|
|
"in": "query",
|
|
"description": "The UUID of the job to get the artifacts of.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/job/cancel": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "OK"
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Cancel a training job.",
|
|
"description": "Cancel a training job.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/CancelTrainingJobRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/job/status": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PostTrainingJobStatusResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PostTrainingJobStatusResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Get the status of a training job.",
|
|
"description": "Get the status of a training job.",
|
|
"parameters": [
|
|
{
|
|
"name": "job_uuid",
|
|
"in": "query",
|
|
"description": "The UUID of the job to get the status of.",
|
|
"required": true,
|
|
"schema": {
|
|
"type": "string"
|
|
}
|
|
}
|
|
],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/jobs": {
|
|
"get": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A ListPostTrainingJobsResponse.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/ListPostTrainingJobsResponse"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Get all training jobs.",
|
|
"description": "Get all training jobs.",
|
|
"parameters": [],
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/preference-optimize": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PostTrainingJob.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PostTrainingJob"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Run preference optimization of a model.",
|
|
"description": "Run preference optimization of a model.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PreferenceOptimizeRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
},
|
|
"/v1alpha/post-training/supervised-fine-tune": {
|
|
"post": {
|
|
"responses": {
|
|
"200": {
|
|
"description": "A PostTrainingJob.",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/PostTrainingJob"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"400": {
|
|
"$ref": "#/components/responses/BadRequest400"
|
|
},
|
|
"429": {
|
|
"$ref": "#/components/responses/TooManyRequests429"
|
|
},
|
|
"500": {
|
|
"$ref": "#/components/responses/InternalServerError500"
|
|
},
|
|
"default": {
|
|
"$ref": "#/components/responses/DefaultError"
|
|
}
|
|
},
|
|
"tags": [
|
|
"PostTraining (Coming Soon)"
|
|
],
|
|
"summary": "Run supervised fine-tuning of a model.",
|
|
"description": "Run supervised fine-tuning of a model.",
|
|
"parameters": [],
|
|
"requestBody": {
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/SupervisedFineTuneRequest"
|
|
}
|
|
}
|
|
},
|
|
"required": true
|
|
},
|
|
"deprecated": false
|
|
}
|
|
}
|
|
},
|
|
"jsonSchemaDialect": "https://json-schema.org/draft/2020-12/schema",
|
|
"components": {
|
|
"schemas": {
|
|
"Error": {
|
|
"type": "object",
|
|
"properties": {
|
|
"status": {
|
|
"type": "integer",
|
|
"description": "HTTP status code"
|
|
},
|
|
"title": {
|
|
"type": "string",
|
|
"description": "Error title, a short summary of the error which is invariant for an error type"
|
|
},
|
|
"detail": {
|
|
"type": "string",
|
|
"description": "Error detail, a longer human-readable description of the error"
|
|
},
|
|
"instance": {
|
|
"type": "string",
|
|
"description": "(Optional) A URL which can be used to retrieve more information about the specific occurrence of the error"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"status",
|
|
"title",
|
|
"detail"
|
|
],
|
|
"title": "Error",
|
|
"description": "Error response from the API. Roughly follows RFC 7807."
|
|
},
|
|
"AppendRowsRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"rows": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The rows to append to the dataset."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"rows"
|
|
],
|
|
"title": "AppendRowsRequest"
|
|
},
|
|
"PaginatedResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"data": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The list of items for the current page"
|
|
},
|
|
"has_more": {
|
|
"type": "boolean",
|
|
"description": "Whether there are more items available after this set"
|
|
},
|
|
"url": {
|
|
"type": "string",
|
|
"description": "The URL for accessing this list"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"data",
|
|
"has_more"
|
|
],
|
|
"title": "PaginatedResponse",
|
|
"description": "A generic paginated response that follows a simple format."
|
|
},
|
|
"Dataset": {
|
|
"type": "object",
|
|
"properties": {
|
|
"identifier": {
|
|
"type": "string"
|
|
},
|
|
"provider_resource_id": {
|
|
"type": "string"
|
|
},
|
|
"provider_id": {
|
|
"type": "string"
|
|
},
|
|
"type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"model",
|
|
"shield",
|
|
"vector_store",
|
|
"dataset",
|
|
"scoring_function",
|
|
"benchmark",
|
|
"tool",
|
|
"tool_group",
|
|
"prompt"
|
|
],
|
|
"const": "dataset",
|
|
"default": "dataset",
|
|
"description": "Type of resource, always 'dataset' for datasets"
|
|
},
|
|
"purpose": {
|
|
"type": "string",
|
|
"enum": [
|
|
"post-training/messages",
|
|
"eval/question-answer",
|
|
"eval/messages-answer"
|
|
],
|
|
"description": "Purpose of the dataset indicating its intended use"
|
|
},
|
|
"source": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/URIDataSource"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/RowsDataSource"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"uri": "#/components/schemas/URIDataSource",
|
|
"rows": "#/components/schemas/RowsDataSource"
|
|
}
|
|
},
|
|
"description": "Data source configuration for the dataset"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "Additional metadata for the dataset"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"identifier",
|
|
"provider_id",
|
|
"type",
|
|
"purpose",
|
|
"source",
|
|
"metadata"
|
|
],
|
|
"title": "Dataset",
|
|
"description": "Dataset resource for storing and accessing training or evaluation data."
|
|
},
|
|
"RowsDataSource": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "rows",
|
|
"default": "rows"
|
|
},
|
|
"rows": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The dataset is stored in rows. E.g. - [ {\"messages\": [{\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}]} ]"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"rows"
|
|
],
|
|
"title": "RowsDataSource",
|
|
"description": "A dataset stored in rows."
|
|
},
|
|
"URIDataSource": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "uri",
|
|
"default": "uri"
|
|
},
|
|
"uri": {
|
|
"type": "string",
|
|
"description": "The dataset can be obtained from a URI. E.g. - \"https://mywebsite.com/mydata.jsonl\" - \"lsfs://mydata.jsonl\" - \"data:csv;base64,{base64_content}\""
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"uri"
|
|
],
|
|
"title": "URIDataSource",
|
|
"description": "A dataset that can be obtained from a URI."
|
|
},
|
|
"ListDatasetsResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"data": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/Dataset"
|
|
},
|
|
"description": "List of datasets"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"data"
|
|
],
|
|
"title": "ListDatasetsResponse",
|
|
"description": "Response from listing datasets."
|
|
},
|
|
"DataSource": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/URIDataSource"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/RowsDataSource"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"uri": "#/components/schemas/URIDataSource",
|
|
"rows": "#/components/schemas/RowsDataSource"
|
|
}
|
|
}
|
|
},
|
|
"RegisterDatasetRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"purpose": {
|
|
"type": "string",
|
|
"enum": [
|
|
"post-training/messages",
|
|
"eval/question-answer",
|
|
"eval/messages-answer"
|
|
],
|
|
"description": "The purpose of the dataset. One of: - \"post-training/messages\": The dataset contains a messages column with list of messages for post-training. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}, ] } - \"eval/question-answer\": The dataset contains a question column and an answer column for evaluation. { \"question\": \"What is the capital of France?\", \"answer\": \"Paris\" } - \"eval/messages-answer\": The dataset contains a messages column with list of messages and an answer column for evaluation. { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, my name is John Doe.\"}, {\"role\": \"assistant\", \"content\": \"Hello, John Doe. How can I help you today?\"}, {\"role\": \"user\", \"content\": \"What's my name?\"}, ], \"answer\": \"John Doe\" }"
|
|
},
|
|
"source": {
|
|
"$ref": "#/components/schemas/DataSource",
|
|
"description": "The data source of the dataset. Ensure that the data source schema is compatible with the purpose of the dataset. Examples: - { \"type\": \"uri\", \"uri\": \"https://mywebsite.com/mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"lsfs://mydata.jsonl\" } - { \"type\": \"uri\", \"uri\": \"data:csv;base64,{base64_content}\" } - { \"type\": \"uri\", \"uri\": \"huggingface://llamastack/simpleqa?split=train\" } - { \"type\": \"rows\", \"rows\": [ { \"messages\": [ {\"role\": \"user\", \"content\": \"Hello, world!\"}, {\"role\": \"assistant\", \"content\": \"Hello, world!\"}, ] } ] }"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The metadata for the dataset. - E.g. {\"description\": \"My dataset\"}."
|
|
},
|
|
"dataset_id": {
|
|
"type": "string",
|
|
"description": "The ID of the dataset. If not provided, an ID will be generated."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"purpose",
|
|
"source"
|
|
],
|
|
"title": "RegisterDatasetRequest"
|
|
},
|
|
"AgentConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"sampling_params": {
|
|
"$ref": "#/components/schemas/SamplingParams"
|
|
},
|
|
"input_shields": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
"output_shields": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
"toolgroups": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/AgentTool"
|
|
}
|
|
},
|
|
"client_tools": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/ToolDef"
|
|
}
|
|
},
|
|
"tool_choice": {
|
|
"type": "string",
|
|
"enum": [
|
|
"auto",
|
|
"required",
|
|
"none"
|
|
],
|
|
"title": "ToolChoice",
|
|
"description": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model.",
|
|
"deprecated": true
|
|
},
|
|
"tool_prompt_format": {
|
|
"type": "string",
|
|
"enum": [
|
|
"json",
|
|
"function_tag",
|
|
"python_list"
|
|
],
|
|
"title": "ToolPromptFormat",
|
|
"description": "Prompt format for calling custom / zero shot tools.",
|
|
"deprecated": true
|
|
},
|
|
"tool_config": {
|
|
"$ref": "#/components/schemas/ToolConfig"
|
|
},
|
|
"max_infer_iters": {
|
|
"type": "integer",
|
|
"default": 10
|
|
},
|
|
"model": {
|
|
"type": "string",
|
|
"description": "The model identifier to use for the agent"
|
|
},
|
|
"instructions": {
|
|
"type": "string",
|
|
"description": "The system instructions for the agent"
|
|
},
|
|
"name": {
|
|
"type": "string",
|
|
"description": "Optional name for the agent, used in telemetry and identification"
|
|
},
|
|
"enable_session_persistence": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "Optional flag indicating whether session data has to be persisted"
|
|
},
|
|
"response_format": {
|
|
"$ref": "#/components/schemas/ResponseFormat",
|
|
"description": "Optional response format configuration"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"model",
|
|
"instructions"
|
|
],
|
|
"title": "AgentConfig",
|
|
"description": "Configuration for an agent."
|
|
},
|
|
"AgentTool": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "object",
|
|
"properties": {
|
|
"name": {
|
|
"type": "string"
|
|
},
|
|
"args": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"name",
|
|
"args"
|
|
],
|
|
"title": "AgentToolGroupWithArgs"
|
|
}
|
|
]
|
|
},
|
|
"GrammarResponseFormat": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"json_schema",
|
|
"grammar"
|
|
],
|
|
"description": "Must be \"grammar\" to identify this format type",
|
|
"const": "grammar",
|
|
"default": "grammar"
|
|
},
|
|
"bnf": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The BNF grammar specification the response should conform to"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"bnf"
|
|
],
|
|
"title": "GrammarResponseFormat",
|
|
"description": "Configuration for grammar-guided response generation."
|
|
},
|
|
"GreedySamplingStrategy": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "greedy",
|
|
"default": "greedy",
|
|
"description": "Must be \"greedy\" to identify this sampling strategy"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type"
|
|
],
|
|
"title": "GreedySamplingStrategy",
|
|
"description": "Greedy sampling strategy that selects the highest probability token at each step."
|
|
},
|
|
"JsonSchemaResponseFormat": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"json_schema",
|
|
"grammar"
|
|
],
|
|
"description": "Must be \"json_schema\" to identify this format type",
|
|
"const": "json_schema",
|
|
"default": "json_schema"
|
|
},
|
|
"json_schema": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The JSON schema the response should conform to. In a Python SDK, this is often a `pydantic` model."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"json_schema"
|
|
],
|
|
"title": "JsonSchemaResponseFormat",
|
|
"description": "Configuration for JSON schema-guided response generation."
|
|
},
|
|
"ResponseFormat": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/JsonSchemaResponseFormat"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/GrammarResponseFormat"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"json_schema": "#/components/schemas/JsonSchemaResponseFormat",
|
|
"grammar": "#/components/schemas/GrammarResponseFormat"
|
|
}
|
|
}
|
|
},
|
|
"SamplingParams": {
|
|
"type": "object",
|
|
"properties": {
|
|
"strategy": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/GreedySamplingStrategy"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/TopPSamplingStrategy"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/TopKSamplingStrategy"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"greedy": "#/components/schemas/GreedySamplingStrategy",
|
|
"top_p": "#/components/schemas/TopPSamplingStrategy",
|
|
"top_k": "#/components/schemas/TopKSamplingStrategy"
|
|
}
|
|
},
|
|
"description": "The sampling strategy."
|
|
},
|
|
"max_tokens": {
|
|
"type": "integer",
|
|
"default": 0,
|
|
"description": "The maximum number of tokens that can be generated in the completion. The token count of your prompt plus max_tokens cannot exceed the model's context length."
|
|
},
|
|
"repetition_penalty": {
|
|
"type": "number",
|
|
"default": 1.0,
|
|
"description": "Number between -2.0 and 2.0. Positive values penalize new tokens based on whether they appear in the text so far, increasing the model's likelihood to talk about new topics."
|
|
},
|
|
"stop": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "Up to 4 sequences where the API will stop generating further tokens. The returned text will not contain the stop sequence."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"strategy"
|
|
],
|
|
"title": "SamplingParams",
|
|
"description": "Sampling parameters."
|
|
},
|
|
"ToolConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"tool_choice": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string",
|
|
"enum": [
|
|
"auto",
|
|
"required",
|
|
"none"
|
|
],
|
|
"title": "ToolChoice",
|
|
"description": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model."
|
|
},
|
|
{
|
|
"type": "string"
|
|
}
|
|
],
|
|
"default": "auto",
|
|
"description": "(Optional) Whether tool use is automatic, required, or none. Can also specify a tool name to use a specific tool. Defaults to ToolChoice.auto."
|
|
},
|
|
"tool_prompt_format": {
|
|
"type": "string",
|
|
"enum": [
|
|
"json",
|
|
"function_tag",
|
|
"python_list"
|
|
],
|
|
"description": "(Optional) Instructs the model how to format tool calls. By default, Llama Stack will attempt to use a format that is best adapted to the model. - `ToolPromptFormat.json`: The tool calls are formatted as a JSON object. - `ToolPromptFormat.function_tag`: The tool calls are enclosed in a <function=function_name> tag. - `ToolPromptFormat.python_list`: The tool calls are output as Python syntax -- a list of function calls."
|
|
},
|
|
"system_message_behavior": {
|
|
"type": "string",
|
|
"enum": [
|
|
"append",
|
|
"replace"
|
|
],
|
|
"description": "(Optional) Config for how to override the default system prompt. - `SystemMessageBehavior.append`: Appends the provided system message to the default system prompt. - `SystemMessageBehavior.replace`: Replaces the default system prompt with the provided system message. The system message can include the string '{{function_definitions}}' to indicate where the function definitions should be inserted.",
|
|
"default": "append"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"title": "ToolConfig",
|
|
"description": "Configuration for tool use."
|
|
},
|
|
"ToolDef": {
|
|
"type": "object",
|
|
"properties": {
|
|
"toolgroup_id": {
|
|
"type": "string",
|
|
"description": "(Optional) ID of the tool group this tool belongs to"
|
|
},
|
|
"name": {
|
|
"type": "string",
|
|
"description": "Name of the tool"
|
|
},
|
|
"description": {
|
|
"type": "string",
|
|
"description": "(Optional) Human-readable description of what the tool does"
|
|
},
|
|
"input_schema": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) JSON Schema for tool inputs (MCP inputSchema)"
|
|
},
|
|
"output_schema": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) JSON Schema for tool outputs (MCP outputSchema)"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) Additional metadata about the tool"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"name"
|
|
],
|
|
"title": "ToolDef",
|
|
"description": "Tool definition used in runtime contexts."
|
|
},
|
|
"TopKSamplingStrategy": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "top_k",
|
|
"default": "top_k",
|
|
"description": "Must be \"top_k\" to identify this sampling strategy"
|
|
},
|
|
"top_k": {
|
|
"type": "integer",
|
|
"description": "Number of top tokens to consider for sampling. Must be at least 1"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"top_k"
|
|
],
|
|
"title": "TopKSamplingStrategy",
|
|
"description": "Top-k sampling strategy that restricts sampling to the k most likely tokens."
|
|
},
|
|
"TopPSamplingStrategy": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "top_p",
|
|
"default": "top_p",
|
|
"description": "Must be \"top_p\" to identify this sampling strategy"
|
|
},
|
|
"temperature": {
|
|
"type": "number",
|
|
"description": "Controls randomness in sampling. Higher values increase randomness"
|
|
},
|
|
"top_p": {
|
|
"type": "number",
|
|
"default": 0.95,
|
|
"description": "Cumulative probability threshold for nucleus sampling. Defaults to 0.95"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type"
|
|
],
|
|
"title": "TopPSamplingStrategy",
|
|
"description": "Top-p (nucleus) sampling strategy that samples from the smallest set of tokens with cumulative probability >= p."
|
|
},
|
|
"CreateAgentRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"agent_config": {
|
|
"$ref": "#/components/schemas/AgentConfig",
|
|
"description": "The configuration for the agent."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"agent_config"
|
|
],
|
|
"title": "CreateAgentRequest"
|
|
},
|
|
"AgentCreateResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"agent_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the created agent"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"agent_id"
|
|
],
|
|
"title": "AgentCreateResponse",
|
|
"description": "Response returned when creating a new agent."
|
|
},
|
|
"Agent": {
|
|
"type": "object",
|
|
"properties": {
|
|
"agent_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the agent"
|
|
},
|
|
"agent_config": {
|
|
"$ref": "#/components/schemas/AgentConfig",
|
|
"description": "Configuration settings for the agent"
|
|
},
|
|
"created_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "Timestamp when the agent was created"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"agent_id",
|
|
"agent_config",
|
|
"created_at"
|
|
],
|
|
"title": "Agent",
|
|
"description": "An agent instance with configuration and metadata."
|
|
},
|
|
"CreateAgentSessionRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"session_name": {
|
|
"type": "string",
|
|
"description": "The name of the session to create."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"session_name"
|
|
],
|
|
"title": "CreateAgentSessionRequest"
|
|
},
|
|
"AgentSessionCreateResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"session_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the created session"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"session_id"
|
|
],
|
|
"title": "AgentSessionCreateResponse",
|
|
"description": "Response returned when creating a new agent session."
|
|
},
|
|
"CompletionMessage": {
|
|
"type": "object",
|
|
"properties": {
|
|
"role": {
|
|
"type": "string",
|
|
"const": "assistant",
|
|
"default": "assistant",
|
|
"description": "Must be \"assistant\" to identify this as the model's response"
|
|
},
|
|
"content": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The content of the model's response"
|
|
},
|
|
"stop_reason": {
|
|
"type": "string",
|
|
"enum": [
|
|
"end_of_turn",
|
|
"end_of_message",
|
|
"out_of_tokens"
|
|
],
|
|
"description": "Reason why the model stopped generating. Options are: - `StopReason.end_of_turn`: The model finished generating the entire response. - `StopReason.end_of_message`: The model finished generating but generated a partial response -- usually, a tool call. The user may call the tool and continue the conversation with the tool's response. - `StopReason.out_of_tokens`: The model ran out of token budget."
|
|
},
|
|
"tool_calls": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/ToolCall"
|
|
},
|
|
"description": "List of tool calls. Each tool call is a ToolCall object."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"role",
|
|
"content",
|
|
"stop_reason"
|
|
],
|
|
"title": "CompletionMessage",
|
|
"description": "A message containing the model's (assistant) response in a chat conversation."
|
|
},
|
|
"ImageContentItem": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "image",
|
|
"default": "image",
|
|
"description": "Discriminator type of the content item. Always \"image\""
|
|
},
|
|
"image": {
|
|
"type": "object",
|
|
"properties": {
|
|
"url": {
|
|
"$ref": "#/components/schemas/URL",
|
|
"description": "A URL of the image or data URL in the format of data:image/{type};base64,{data}. Note that URL could have length limits."
|
|
},
|
|
"data": {
|
|
"type": "string",
|
|
"contentEncoding": "base64",
|
|
"description": "base64 encoded image data as string"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"description": "Image as a base64 encoded string or an URL"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"image"
|
|
],
|
|
"title": "ImageContentItem",
|
|
"description": "A image content item"
|
|
},
|
|
"InferenceStep": {
|
|
"type": "object",
|
|
"properties": {
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "The ID of the turn."
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "The ID of the step."
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step started."
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step completed."
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"title": "StepType",
|
|
"description": "Type of the step in an agent turn.",
|
|
"const": "inference",
|
|
"default": "inference"
|
|
},
|
|
"model_response": {
|
|
"$ref": "#/components/schemas/CompletionMessage",
|
|
"description": "The response from the LLM."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"turn_id",
|
|
"step_id",
|
|
"step_type",
|
|
"model_response"
|
|
],
|
|
"title": "InferenceStep",
|
|
"description": "An inference step in an agent turn."
|
|
},
|
|
"InterleavedContent": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
},
|
|
{
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
}
|
|
}
|
|
]
|
|
},
|
|
"InterleavedContentItem": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/ImageContentItem"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/TextContentItem"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"image": "#/components/schemas/ImageContentItem",
|
|
"text": "#/components/schemas/TextContentItem"
|
|
}
|
|
}
|
|
},
|
|
"MemoryRetrievalStep": {
|
|
"type": "object",
|
|
"properties": {
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "The ID of the turn."
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "The ID of the step."
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step started."
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step completed."
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"title": "StepType",
|
|
"description": "Type of the step in an agent turn.",
|
|
"const": "memory_retrieval",
|
|
"default": "memory_retrieval"
|
|
},
|
|
"vector_db_ids": {
|
|
"type": "string",
|
|
"description": "The IDs of the vector databases to retrieve context from."
|
|
},
|
|
"inserted_context": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The context retrieved from the vector databases."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"turn_id",
|
|
"step_id",
|
|
"step_type",
|
|
"vector_db_ids",
|
|
"inserted_context"
|
|
],
|
|
"title": "MemoryRetrievalStep",
|
|
"description": "A memory retrieval step in an agent turn."
|
|
},
|
|
"SafetyViolation": {
|
|
"type": "object",
|
|
"properties": {
|
|
"violation_level": {
|
|
"$ref": "#/components/schemas/ViolationLevel",
|
|
"description": "Severity level of the violation"
|
|
},
|
|
"user_message": {
|
|
"type": "string",
|
|
"description": "(Optional) Message to convey to the user about the violation"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "Additional metadata including specific violation codes for debugging and telemetry"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"violation_level",
|
|
"metadata"
|
|
],
|
|
"title": "SafetyViolation",
|
|
"description": "Details of a safety violation detected by content moderation."
|
|
},
|
|
"Session": {
|
|
"type": "object",
|
|
"properties": {
|
|
"session_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the conversation session"
|
|
},
|
|
"session_name": {
|
|
"type": "string",
|
|
"description": "Human-readable name for the session"
|
|
},
|
|
"turns": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/Turn"
|
|
},
|
|
"description": "List of all turns that have occurred in this session"
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "Timestamp when the session was created"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"session_id",
|
|
"session_name",
|
|
"turns",
|
|
"started_at"
|
|
],
|
|
"title": "Session",
|
|
"description": "A single session of an interaction with an Agentic System."
|
|
},
|
|
"ShieldCallStep": {
|
|
"type": "object",
|
|
"properties": {
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "The ID of the turn."
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "The ID of the step."
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step started."
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step completed."
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"title": "StepType",
|
|
"description": "Type of the step in an agent turn.",
|
|
"const": "shield_call",
|
|
"default": "shield_call"
|
|
},
|
|
"violation": {
|
|
"$ref": "#/components/schemas/SafetyViolation",
|
|
"description": "The violation from the shield call."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"turn_id",
|
|
"step_id",
|
|
"step_type"
|
|
],
|
|
"title": "ShieldCallStep",
|
|
"description": "A shield call step in an agent turn."
|
|
},
|
|
"TextContentItem": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "text",
|
|
"default": "text",
|
|
"description": "Discriminator type of the content item. Always \"text\""
|
|
},
|
|
"text": {
|
|
"type": "string",
|
|
"description": "Text content"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"text"
|
|
],
|
|
"title": "TextContentItem",
|
|
"description": "A text content item"
|
|
},
|
|
"ToolCall": {
|
|
"type": "object",
|
|
"properties": {
|
|
"call_id": {
|
|
"type": "string"
|
|
},
|
|
"tool_name": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string",
|
|
"enum": [
|
|
"brave_search",
|
|
"wolfram_alpha",
|
|
"photogen",
|
|
"code_interpreter"
|
|
],
|
|
"title": "BuiltinTool"
|
|
},
|
|
{
|
|
"type": "string"
|
|
}
|
|
]
|
|
},
|
|
"arguments": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"call_id",
|
|
"tool_name",
|
|
"arguments"
|
|
],
|
|
"title": "ToolCall"
|
|
},
|
|
"ToolExecutionStep": {
|
|
"type": "object",
|
|
"properties": {
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "The ID of the turn."
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "The ID of the step."
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step started."
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "The time the step completed."
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"title": "StepType",
|
|
"description": "Type of the step in an agent turn.",
|
|
"const": "tool_execution",
|
|
"default": "tool_execution"
|
|
},
|
|
"tool_calls": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/ToolCall"
|
|
},
|
|
"description": "The tool calls to execute."
|
|
},
|
|
"tool_responses": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/ToolResponse"
|
|
},
|
|
"description": "The tool responses from the tool calls."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"turn_id",
|
|
"step_id",
|
|
"step_type",
|
|
"tool_calls",
|
|
"tool_responses"
|
|
],
|
|
"title": "ToolExecutionStep",
|
|
"description": "A tool execution step in an agent turn."
|
|
},
|
|
"ToolResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"call_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the tool call this response is for"
|
|
},
|
|
"tool_name": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string",
|
|
"enum": [
|
|
"brave_search",
|
|
"wolfram_alpha",
|
|
"photogen",
|
|
"code_interpreter"
|
|
],
|
|
"title": "BuiltinTool"
|
|
},
|
|
{
|
|
"type": "string"
|
|
}
|
|
],
|
|
"description": "Name of the tool that was invoked"
|
|
},
|
|
"content": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The response content from the tool"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) Additional metadata about the tool response"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"call_id",
|
|
"tool_name",
|
|
"content"
|
|
],
|
|
"title": "ToolResponse",
|
|
"description": "Response from a tool invocation."
|
|
},
|
|
"ToolResponseMessage": {
|
|
"type": "object",
|
|
"properties": {
|
|
"role": {
|
|
"type": "string",
|
|
"const": "tool",
|
|
"default": "tool",
|
|
"description": "Must be \"tool\" to identify this as a tool response"
|
|
},
|
|
"call_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the tool call this response is for"
|
|
},
|
|
"content": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The response content from the tool"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"role",
|
|
"call_id",
|
|
"content"
|
|
],
|
|
"title": "ToolResponseMessage",
|
|
"description": "A message representing the result of a tool invocation."
|
|
},
|
|
"Turn": {
|
|
"type": "object",
|
|
"properties": {
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the turn within a session"
|
|
},
|
|
"session_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the conversation session"
|
|
},
|
|
"input_messages": {
|
|
"type": "array",
|
|
"items": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/UserMessage"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolResponseMessage"
|
|
}
|
|
]
|
|
},
|
|
"description": "List of messages that initiated this turn"
|
|
},
|
|
"steps": {
|
|
"type": "array",
|
|
"items": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/InferenceStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolExecutionStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ShieldCallStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "step_type",
|
|
"mapping": {
|
|
"inference": "#/components/schemas/InferenceStep",
|
|
"tool_execution": "#/components/schemas/ToolExecutionStep",
|
|
"shield_call": "#/components/schemas/ShieldCallStep",
|
|
"memory_retrieval": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
}
|
|
},
|
|
"description": "Ordered list of processing steps executed during this turn"
|
|
},
|
|
"output_message": {
|
|
"$ref": "#/components/schemas/CompletionMessage",
|
|
"description": "The model's generated response containing content and metadata"
|
|
},
|
|
"output_attachments": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"properties": {
|
|
"content": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
},
|
|
{
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
}
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/URL"
|
|
}
|
|
],
|
|
"description": "The content of the attachment."
|
|
},
|
|
"mime_type": {
|
|
"type": "string",
|
|
"description": "The MIME type of the attachment."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"content",
|
|
"mime_type"
|
|
],
|
|
"title": "Attachment",
|
|
"description": "An attachment to an agent turn."
|
|
},
|
|
"description": "(Optional) Files or media attached to the agent's response"
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "Timestamp when the turn began"
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "(Optional) Timestamp when the turn finished, if completed"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"turn_id",
|
|
"session_id",
|
|
"input_messages",
|
|
"steps",
|
|
"output_message",
|
|
"started_at"
|
|
],
|
|
"title": "Turn",
|
|
"description": "A single turn in an interaction with an Agentic System."
|
|
},
|
|
"URL": {
|
|
"type": "object",
|
|
"properties": {
|
|
"uri": {
|
|
"type": "string",
|
|
"description": "The URL string pointing to the resource"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"uri"
|
|
],
|
|
"title": "URL",
|
|
"description": "A URL reference to external content."
|
|
},
|
|
"UserMessage": {
|
|
"type": "object",
|
|
"properties": {
|
|
"role": {
|
|
"type": "string",
|
|
"const": "user",
|
|
"default": "user",
|
|
"description": "Must be \"user\" to identify this as a user message"
|
|
},
|
|
"content": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The content of the message, which can include text and other media"
|
|
},
|
|
"context": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "(Optional) This field is used internally by Llama Stack to pass RAG context. This field may be removed in the API in the future."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"role",
|
|
"content"
|
|
],
|
|
"title": "UserMessage",
|
|
"description": "A message from the user in a chat conversation."
|
|
},
|
|
"ViolationLevel": {
|
|
"type": "string",
|
|
"enum": [
|
|
"info",
|
|
"warn",
|
|
"error"
|
|
],
|
|
"title": "ViolationLevel",
|
|
"description": "Severity level of a safety violation."
|
|
},
|
|
"CreateAgentTurnRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"messages": {
|
|
"type": "array",
|
|
"items": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/UserMessage"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolResponseMessage"
|
|
}
|
|
]
|
|
},
|
|
"description": "List of messages to start the turn with."
|
|
},
|
|
"stream": {
|
|
"type": "boolean",
|
|
"description": "(Optional) If True, generate an SSE event stream of the response. Defaults to False."
|
|
},
|
|
"documents": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"properties": {
|
|
"content": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
},
|
|
{
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/InterleavedContentItem"
|
|
}
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/URL"
|
|
}
|
|
],
|
|
"description": "The content of the document."
|
|
},
|
|
"mime_type": {
|
|
"type": "string",
|
|
"description": "The MIME type of the document."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"content",
|
|
"mime_type"
|
|
],
|
|
"title": "Document",
|
|
"description": "A document to be used by an agent."
|
|
},
|
|
"description": "(Optional) List of documents to create the turn with."
|
|
},
|
|
"toolgroups": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/AgentTool"
|
|
},
|
|
"description": "(Optional) List of toolgroups to create the turn with, will be used in addition to the agent's config toolgroups for the request."
|
|
},
|
|
"tool_config": {
|
|
"$ref": "#/components/schemas/ToolConfig",
|
|
"description": "(Optional) The tool configuration to create the turn with, will be used to override the agent's tool_config."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"messages"
|
|
],
|
|
"title": "CreateAgentTurnRequest"
|
|
},
|
|
"AgentTurnResponseEvent": {
|
|
"type": "object",
|
|
"properties": {
|
|
"payload": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseStepStartPayload"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseStepProgressPayload"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseStepCompletePayload"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseTurnStartPayload"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseTurnCompletePayload"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "event_type",
|
|
"mapping": {
|
|
"step_start": "#/components/schemas/AgentTurnResponseStepStartPayload",
|
|
"step_progress": "#/components/schemas/AgentTurnResponseStepProgressPayload",
|
|
"step_complete": "#/components/schemas/AgentTurnResponseStepCompletePayload",
|
|
"turn_start": "#/components/schemas/AgentTurnResponseTurnStartPayload",
|
|
"turn_complete": "#/components/schemas/AgentTurnResponseTurnCompletePayload",
|
|
"turn_awaiting_input": "#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload"
|
|
}
|
|
},
|
|
"description": "Event-specific payload containing event data"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"payload"
|
|
],
|
|
"title": "AgentTurnResponseEvent",
|
|
"description": "An event in an agent turn response stream."
|
|
},
|
|
"AgentTurnResponseStepCompletePayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "step_complete",
|
|
"default": "step_complete",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"description": "Type of step being executed"
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the step within a turn"
|
|
},
|
|
"step_details": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/InferenceStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolExecutionStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ShieldCallStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "step_type",
|
|
"mapping": {
|
|
"inference": "#/components/schemas/InferenceStep",
|
|
"tool_execution": "#/components/schemas/ToolExecutionStep",
|
|
"shield_call": "#/components/schemas/ShieldCallStep",
|
|
"memory_retrieval": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
},
|
|
"description": "Complete details of the executed step"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"step_type",
|
|
"step_id",
|
|
"step_details"
|
|
],
|
|
"title": "AgentTurnResponseStepCompletePayload",
|
|
"description": "Payload for step completion events in agent turn responses."
|
|
},
|
|
"AgentTurnResponseStepProgressPayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "step_progress",
|
|
"default": "step_progress",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"description": "Type of step being executed"
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the step within a turn"
|
|
},
|
|
"delta": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/TextDelta"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ImageDelta"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolCallDelta"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"text": "#/components/schemas/TextDelta",
|
|
"image": "#/components/schemas/ImageDelta",
|
|
"tool_call": "#/components/schemas/ToolCallDelta"
|
|
}
|
|
},
|
|
"description": "Incremental content changes during step execution"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"step_type",
|
|
"step_id",
|
|
"delta"
|
|
],
|
|
"title": "AgentTurnResponseStepProgressPayload",
|
|
"description": "Payload for step progress events in agent turn responses."
|
|
},
|
|
"AgentTurnResponseStepStartPayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "step_start",
|
|
"default": "step_start",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"step_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"inference",
|
|
"tool_execution",
|
|
"shield_call",
|
|
"memory_retrieval"
|
|
],
|
|
"description": "Type of step being executed"
|
|
},
|
|
"step_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the step within a turn"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) Additional metadata for the step"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"step_type",
|
|
"step_id"
|
|
],
|
|
"title": "AgentTurnResponseStepStartPayload",
|
|
"description": "Payload for step start events in agent turn responses."
|
|
},
|
|
"AgentTurnResponseStreamChunk": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event": {
|
|
"$ref": "#/components/schemas/AgentTurnResponseEvent",
|
|
"description": "Individual event in the agent turn response stream"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event"
|
|
],
|
|
"title": "AgentTurnResponseStreamChunk",
|
|
"description": "Streamed agent turn completion response."
|
|
},
|
|
"AgentTurnResponseTurnAwaitingInputPayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "turn_awaiting_input",
|
|
"default": "turn_awaiting_input",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"turn": {
|
|
"$ref": "#/components/schemas/Turn",
|
|
"description": "Turn data when waiting for external tool responses"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"turn"
|
|
],
|
|
"title": "AgentTurnResponseTurnAwaitingInputPayload",
|
|
"description": "Payload for turn awaiting input events in agent turn responses."
|
|
},
|
|
"AgentTurnResponseTurnCompletePayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "turn_complete",
|
|
"default": "turn_complete",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"turn": {
|
|
"$ref": "#/components/schemas/Turn",
|
|
"description": "Complete turn data including all steps and results"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"turn"
|
|
],
|
|
"title": "AgentTurnResponseTurnCompletePayload",
|
|
"description": "Payload for turn completion events in agent turn responses."
|
|
},
|
|
"AgentTurnResponseTurnStartPayload": {
|
|
"type": "object",
|
|
"properties": {
|
|
"event_type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"step_start",
|
|
"step_complete",
|
|
"step_progress",
|
|
"turn_start",
|
|
"turn_complete",
|
|
"turn_awaiting_input"
|
|
],
|
|
"const": "turn_start",
|
|
"default": "turn_start",
|
|
"description": "Type of event being reported"
|
|
},
|
|
"turn_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the turn within a session"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"event_type",
|
|
"turn_id"
|
|
],
|
|
"title": "AgentTurnResponseTurnStartPayload",
|
|
"description": "Payload for turn start events in agent turn responses."
|
|
},
|
|
"ImageDelta": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "image",
|
|
"default": "image",
|
|
"description": "Discriminator type of the delta. Always \"image\""
|
|
},
|
|
"image": {
|
|
"type": "string",
|
|
"contentEncoding": "base64",
|
|
"description": "The incremental image data as bytes"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"image"
|
|
],
|
|
"title": "ImageDelta",
|
|
"description": "An image content delta for streaming responses."
|
|
},
|
|
"TextDelta": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "text",
|
|
"default": "text",
|
|
"description": "Discriminator type of the delta. Always \"text\""
|
|
},
|
|
"text": {
|
|
"type": "string",
|
|
"description": "The incremental text content"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"text"
|
|
],
|
|
"title": "TextDelta",
|
|
"description": "A text content delta for streaming responses."
|
|
},
|
|
"ToolCallDelta": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "tool_call",
|
|
"default": "tool_call",
|
|
"description": "Discriminator type of the delta. Always \"tool_call\""
|
|
},
|
|
"tool_call": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolCall"
|
|
}
|
|
],
|
|
"description": "Either an in-progress tool call string or the final parsed tool call"
|
|
},
|
|
"parse_status": {
|
|
"type": "string",
|
|
"enum": [
|
|
"started",
|
|
"in_progress",
|
|
"failed",
|
|
"succeeded"
|
|
],
|
|
"description": "Current parsing status of the tool call"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"tool_call",
|
|
"parse_status"
|
|
],
|
|
"title": "ToolCallDelta",
|
|
"description": "A tool call content delta for streaming responses."
|
|
},
|
|
"ResumeAgentTurnRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"tool_responses": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/ToolResponse"
|
|
},
|
|
"description": "The tool call responses to resume the turn with."
|
|
},
|
|
"stream": {
|
|
"type": "boolean",
|
|
"description": "Whether to stream the response."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"tool_responses"
|
|
],
|
|
"title": "ResumeAgentTurnRequest"
|
|
},
|
|
"AgentStepResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"step": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/InferenceStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ToolExecutionStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/ShieldCallStep"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "step_type",
|
|
"mapping": {
|
|
"inference": "#/components/schemas/InferenceStep",
|
|
"tool_execution": "#/components/schemas/ToolExecutionStep",
|
|
"shield_call": "#/components/schemas/ShieldCallStep",
|
|
"memory_retrieval": "#/components/schemas/MemoryRetrievalStep"
|
|
}
|
|
},
|
|
"description": "The complete step data and execution details"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"step"
|
|
],
|
|
"title": "AgentStepResponse",
|
|
"description": "Response containing details of a specific agent step."
|
|
},
|
|
"Benchmark": {
|
|
"type": "object",
|
|
"properties": {
|
|
"identifier": {
|
|
"type": "string"
|
|
},
|
|
"provider_resource_id": {
|
|
"type": "string"
|
|
},
|
|
"provider_id": {
|
|
"type": "string"
|
|
},
|
|
"type": {
|
|
"type": "string",
|
|
"enum": [
|
|
"model",
|
|
"shield",
|
|
"vector_store",
|
|
"dataset",
|
|
"scoring_function",
|
|
"benchmark",
|
|
"tool",
|
|
"tool_group",
|
|
"prompt"
|
|
],
|
|
"const": "benchmark",
|
|
"default": "benchmark",
|
|
"description": "The resource type, always benchmark"
|
|
},
|
|
"dataset_id": {
|
|
"type": "string",
|
|
"description": "Identifier of the dataset to use for the benchmark evaluation"
|
|
},
|
|
"scoring_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "List of scoring function identifiers to apply during evaluation"
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "Metadata for this evaluation task"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"identifier",
|
|
"provider_id",
|
|
"type",
|
|
"dataset_id",
|
|
"scoring_functions",
|
|
"metadata"
|
|
],
|
|
"title": "Benchmark",
|
|
"description": "A benchmark resource for evaluating model performance."
|
|
},
|
|
"ListBenchmarksResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"data": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/Benchmark"
|
|
}
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"data"
|
|
],
|
|
"title": "ListBenchmarksResponse"
|
|
},
|
|
"RegisterBenchmarkRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"benchmark_id": {
|
|
"type": "string",
|
|
"description": "The ID of the benchmark to register."
|
|
},
|
|
"dataset_id": {
|
|
"type": "string",
|
|
"description": "The ID of the dataset to use for the benchmark."
|
|
},
|
|
"scoring_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "The scoring functions to use for the benchmark."
|
|
},
|
|
"provider_benchmark_id": {
|
|
"type": "string",
|
|
"description": "The ID of the provider benchmark to use for the benchmark."
|
|
},
|
|
"provider_id": {
|
|
"type": "string",
|
|
"description": "The ID of the provider to use for the benchmark."
|
|
},
|
|
"metadata": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The metadata to use for the benchmark."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"benchmark_id",
|
|
"dataset_id",
|
|
"scoring_functions"
|
|
],
|
|
"title": "RegisterBenchmarkRequest"
|
|
},
|
|
"AgentCandidate": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "agent",
|
|
"default": "agent"
|
|
},
|
|
"config": {
|
|
"$ref": "#/components/schemas/AgentConfig",
|
|
"description": "The configuration for the agent candidate."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"config"
|
|
],
|
|
"title": "AgentCandidate",
|
|
"description": "An agent candidate for evaluation."
|
|
},
|
|
"AggregationFunctionType": {
|
|
"type": "string",
|
|
"enum": [
|
|
"average",
|
|
"weighted_average",
|
|
"median",
|
|
"categorical_count",
|
|
"accuracy"
|
|
],
|
|
"title": "AggregationFunctionType",
|
|
"description": "Types of aggregation functions for scoring results."
|
|
},
|
|
"BasicScoringFnParams": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"$ref": "#/components/schemas/ScoringFnParamsType",
|
|
"const": "basic",
|
|
"default": "basic",
|
|
"description": "The type of scoring function parameters, always basic"
|
|
},
|
|
"aggregation_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/AggregationFunctionType"
|
|
},
|
|
"description": "Aggregation functions to apply to the scores of each row"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"aggregation_functions"
|
|
],
|
|
"title": "BasicScoringFnParams",
|
|
"description": "Parameters for basic scoring function configuration."
|
|
},
|
|
"BenchmarkConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"eval_candidate": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/ModelCandidate"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/AgentCandidate"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"model": "#/components/schemas/ModelCandidate",
|
|
"agent": "#/components/schemas/AgentCandidate"
|
|
}
|
|
},
|
|
"description": "The candidate to evaluate."
|
|
},
|
|
"scoring_params": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"$ref": "#/components/schemas/ScoringFnParams"
|
|
},
|
|
"description": "Map between scoring function id and parameters for each scoring function you want to run"
|
|
},
|
|
"num_examples": {
|
|
"type": "integer",
|
|
"description": "(Optional) The number of examples to evaluate. If not provided, all examples in the dataset will be evaluated"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"eval_candidate",
|
|
"scoring_params"
|
|
],
|
|
"title": "BenchmarkConfig",
|
|
"description": "A benchmark configuration for evaluation."
|
|
},
|
|
"LLMAsJudgeScoringFnParams": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"$ref": "#/components/schemas/ScoringFnParamsType",
|
|
"const": "llm_as_judge",
|
|
"default": "llm_as_judge",
|
|
"description": "The type of scoring function parameters, always llm_as_judge"
|
|
},
|
|
"judge_model": {
|
|
"type": "string",
|
|
"description": "Identifier of the LLM model to use as a judge for scoring"
|
|
},
|
|
"prompt_template": {
|
|
"type": "string",
|
|
"description": "(Optional) Custom prompt template for the judge model"
|
|
},
|
|
"judge_score_regexes": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "Regexes to extract the answer from generated response"
|
|
},
|
|
"aggregation_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/AggregationFunctionType"
|
|
},
|
|
"description": "Aggregation functions to apply to the scores of each row"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"judge_model",
|
|
"judge_score_regexes",
|
|
"aggregation_functions"
|
|
],
|
|
"title": "LLMAsJudgeScoringFnParams",
|
|
"description": "Parameters for LLM-as-judge scoring function configuration."
|
|
},
|
|
"ModelCandidate": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "model",
|
|
"default": "model"
|
|
},
|
|
"model": {
|
|
"type": "string",
|
|
"description": "The model ID to evaluate."
|
|
},
|
|
"sampling_params": {
|
|
"$ref": "#/components/schemas/SamplingParams",
|
|
"description": "The sampling parameters for the model."
|
|
},
|
|
"system_message": {
|
|
"$ref": "#/components/schemas/SystemMessage",
|
|
"description": "(Optional) The system message providing instructions or context to the model."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"model",
|
|
"sampling_params"
|
|
],
|
|
"title": "ModelCandidate",
|
|
"description": "A model candidate for evaluation."
|
|
},
|
|
"RegexParserScoringFnParams": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"$ref": "#/components/schemas/ScoringFnParamsType",
|
|
"const": "regex_parser",
|
|
"default": "regex_parser",
|
|
"description": "The type of scoring function parameters, always regex_parser"
|
|
},
|
|
"parsing_regexes": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "Regex to extract the answer from generated response"
|
|
},
|
|
"aggregation_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/AggregationFunctionType"
|
|
},
|
|
"description": "Aggregation functions to apply to the scores of each row"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"parsing_regexes",
|
|
"aggregation_functions"
|
|
],
|
|
"title": "RegexParserScoringFnParams",
|
|
"description": "Parameters for regex parser scoring function configuration."
|
|
},
|
|
"ScoringFnParams": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/LLMAsJudgeScoringFnParams"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/RegexParserScoringFnParams"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/BasicScoringFnParams"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"llm_as_judge": "#/components/schemas/LLMAsJudgeScoringFnParams",
|
|
"regex_parser": "#/components/schemas/RegexParserScoringFnParams",
|
|
"basic": "#/components/schemas/BasicScoringFnParams"
|
|
}
|
|
}
|
|
},
|
|
"ScoringFnParamsType": {
|
|
"type": "string",
|
|
"enum": [
|
|
"llm_as_judge",
|
|
"regex_parser",
|
|
"basic"
|
|
],
|
|
"title": "ScoringFnParamsType",
|
|
"description": "Types of scoring function parameter configurations."
|
|
},
|
|
"SystemMessage": {
|
|
"type": "object",
|
|
"properties": {
|
|
"role": {
|
|
"type": "string",
|
|
"const": "system",
|
|
"default": "system",
|
|
"description": "Must be \"system\" to identify this as a system message"
|
|
},
|
|
"content": {
|
|
"$ref": "#/components/schemas/InterleavedContent",
|
|
"description": "The content of the \"system prompt\". If multiple system messages are provided, they are concatenated. The underlying Llama Stack code may also add other system messages (for example, for formatting tool definitions)."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"role",
|
|
"content"
|
|
],
|
|
"title": "SystemMessage",
|
|
"description": "A system message providing instructions or context to the model."
|
|
},
|
|
"EvaluateRowsRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"input_rows": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The rows to evaluate."
|
|
},
|
|
"scoring_functions": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "The scoring functions to use for the evaluation."
|
|
},
|
|
"benchmark_config": {
|
|
"$ref": "#/components/schemas/BenchmarkConfig",
|
|
"description": "The configuration for the benchmark."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"input_rows",
|
|
"scoring_functions",
|
|
"benchmark_config"
|
|
],
|
|
"title": "EvaluateRowsRequest"
|
|
},
|
|
"EvaluateResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"generations": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The generations from the evaluation."
|
|
},
|
|
"scores": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"$ref": "#/components/schemas/ScoringResult"
|
|
},
|
|
"description": "The scores from the evaluation."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"generations",
|
|
"scores"
|
|
],
|
|
"title": "EvaluateResponse",
|
|
"description": "The response from an evaluation."
|
|
},
|
|
"ScoringResult": {
|
|
"type": "object",
|
|
"properties": {
|
|
"score_rows": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
}
|
|
},
|
|
"description": "The scoring result for each row. Each row is a map of column name to value."
|
|
},
|
|
"aggregated_results": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "Map of metric name to aggregated value"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"score_rows",
|
|
"aggregated_results"
|
|
],
|
|
"title": "ScoringResult",
|
|
"description": "A scoring result for a single row."
|
|
},
|
|
"RunEvalRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"benchmark_config": {
|
|
"$ref": "#/components/schemas/BenchmarkConfig",
|
|
"description": "The configuration for the benchmark."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"benchmark_config"
|
|
],
|
|
"title": "RunEvalRequest"
|
|
},
|
|
"Job": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the job"
|
|
},
|
|
"status": {
|
|
"type": "string",
|
|
"enum": [
|
|
"completed",
|
|
"in_progress",
|
|
"failed",
|
|
"scheduled",
|
|
"cancelled"
|
|
],
|
|
"description": "Current execution status of the job"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_id",
|
|
"status"
|
|
],
|
|
"title": "Job",
|
|
"description": "A job execution instance with status tracking."
|
|
},
|
|
"OpenAIChatCompletionContentPartImageParam": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "image_url",
|
|
"default": "image_url",
|
|
"description": "Must be \"image_url\" to identify this as image content"
|
|
},
|
|
"image_url": {
|
|
"$ref": "#/components/schemas/OpenAIImageURL",
|
|
"description": "Image URL specification and processing details"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"image_url"
|
|
],
|
|
"title": "OpenAIChatCompletionContentPartImageParam",
|
|
"description": "Image content part for OpenAI-compatible chat completion messages."
|
|
},
|
|
"OpenAIChatCompletionContentPartTextParam": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "text",
|
|
"default": "text",
|
|
"description": "Must be \"text\" to identify this as text content"
|
|
},
|
|
"text": {
|
|
"type": "string",
|
|
"description": "The text content of the message"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"text"
|
|
],
|
|
"title": "OpenAIChatCompletionContentPartTextParam",
|
|
"description": "Text content part for OpenAI-compatible chat completion messages."
|
|
},
|
|
"OpenAIImageURL": {
|
|
"type": "object",
|
|
"properties": {
|
|
"url": {
|
|
"type": "string",
|
|
"description": "URL of the image to include in the message"
|
|
},
|
|
"detail": {
|
|
"type": "string",
|
|
"description": "(Optional) Level of detail for image processing. Can be \"low\", \"high\", or \"auto\""
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"url"
|
|
],
|
|
"title": "OpenAIImageURL",
|
|
"description": "Image URL specification for OpenAI-compatible chat completion messages."
|
|
},
|
|
"RerankRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"model": {
|
|
"type": "string",
|
|
"description": "The identifier of the reranking model to use."
|
|
},
|
|
"query": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/OpenAIChatCompletionContentPartTextParam"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/OpenAIChatCompletionContentPartImageParam"
|
|
}
|
|
],
|
|
"description": "The search query to rank items against. Can be a string, text content part, or image content part. The input must not exceed the model's max input token length."
|
|
},
|
|
"items": {
|
|
"type": "array",
|
|
"items": {
|
|
"oneOf": [
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/OpenAIChatCompletionContentPartTextParam"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/OpenAIChatCompletionContentPartImageParam"
|
|
}
|
|
]
|
|
},
|
|
"description": "List of items to rerank. Each item can be a string, text content part, or image content part. Each input must not exceed the model's max input token length."
|
|
},
|
|
"max_num_results": {
|
|
"type": "integer",
|
|
"description": "(Optional) Maximum number of results to return. Default: returns all."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"model",
|
|
"query",
|
|
"items"
|
|
],
|
|
"title": "RerankRequest"
|
|
},
|
|
"RerankData": {
|
|
"type": "object",
|
|
"properties": {
|
|
"index": {
|
|
"type": "integer",
|
|
"description": "The original index of the document in the input list"
|
|
},
|
|
"relevance_score": {
|
|
"type": "number",
|
|
"description": "The relevance score from the model output. Values are inverted when applicable so that higher scores indicate greater relevance."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"index",
|
|
"relevance_score"
|
|
],
|
|
"title": "RerankData",
|
|
"description": "A single rerank result from a reranking response."
|
|
},
|
|
"RerankResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"data": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/RerankData"
|
|
},
|
|
"description": "List of rerank result objects, sorted by relevance score (descending)"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"data"
|
|
],
|
|
"title": "RerankResponse",
|
|
"description": "Response from a reranking request."
|
|
},
|
|
"Checkpoint": {
|
|
"type": "object",
|
|
"properties": {
|
|
"identifier": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the checkpoint"
|
|
},
|
|
"created_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "Timestamp when the checkpoint was created"
|
|
},
|
|
"epoch": {
|
|
"type": "integer",
|
|
"description": "Training epoch when the checkpoint was saved"
|
|
},
|
|
"post_training_job_id": {
|
|
"type": "string",
|
|
"description": "Identifier of the training job that created this checkpoint"
|
|
},
|
|
"path": {
|
|
"type": "string",
|
|
"description": "File system path where the checkpoint is stored"
|
|
},
|
|
"training_metrics": {
|
|
"$ref": "#/components/schemas/PostTrainingMetric",
|
|
"description": "(Optional) Training metrics associated with this checkpoint"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"identifier",
|
|
"created_at",
|
|
"epoch",
|
|
"post_training_job_id",
|
|
"path"
|
|
],
|
|
"title": "Checkpoint",
|
|
"description": "Checkpoint created during training runs."
|
|
},
|
|
"PostTrainingJobArtifactsResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the training job"
|
|
},
|
|
"checkpoints": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/Checkpoint"
|
|
},
|
|
"description": "List of model checkpoints created during training"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid",
|
|
"checkpoints"
|
|
],
|
|
"title": "PostTrainingJobArtifactsResponse",
|
|
"description": "Artifacts of a finetuning job."
|
|
},
|
|
"PostTrainingMetric": {
|
|
"type": "object",
|
|
"properties": {
|
|
"epoch": {
|
|
"type": "integer",
|
|
"description": "Training epoch number"
|
|
},
|
|
"train_loss": {
|
|
"type": "number",
|
|
"description": "Loss value on the training dataset"
|
|
},
|
|
"validation_loss": {
|
|
"type": "number",
|
|
"description": "Loss value on the validation dataset"
|
|
},
|
|
"perplexity": {
|
|
"type": "number",
|
|
"description": "Perplexity metric indicating model confidence"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"epoch",
|
|
"train_loss",
|
|
"validation_loss",
|
|
"perplexity"
|
|
],
|
|
"title": "PostTrainingMetric",
|
|
"description": "Training metrics captured during post-training jobs."
|
|
},
|
|
"CancelTrainingJobRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string",
|
|
"description": "The UUID of the job to cancel."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid"
|
|
],
|
|
"title": "CancelTrainingJobRequest"
|
|
},
|
|
"PostTrainingJobStatusResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the training job"
|
|
},
|
|
"status": {
|
|
"type": "string",
|
|
"enum": [
|
|
"completed",
|
|
"in_progress",
|
|
"failed",
|
|
"scheduled",
|
|
"cancelled"
|
|
],
|
|
"description": "Current status of the training job"
|
|
},
|
|
"scheduled_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "(Optional) Timestamp when the job was scheduled"
|
|
},
|
|
"started_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "(Optional) Timestamp when the job execution began"
|
|
},
|
|
"completed_at": {
|
|
"type": "string",
|
|
"format": "date-time",
|
|
"description": "(Optional) Timestamp when the job finished, if completed"
|
|
},
|
|
"resources_allocated": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "(Optional) Information about computational resources allocated to the job"
|
|
},
|
|
"checkpoints": {
|
|
"type": "array",
|
|
"items": {
|
|
"$ref": "#/components/schemas/Checkpoint"
|
|
},
|
|
"description": "List of model checkpoints created during training"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid",
|
|
"status",
|
|
"checkpoints"
|
|
],
|
|
"title": "PostTrainingJobStatusResponse",
|
|
"description": "Status of a finetuning job."
|
|
},
|
|
"ListPostTrainingJobsResponse": {
|
|
"type": "object",
|
|
"properties": {
|
|
"data": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid"
|
|
],
|
|
"title": "PostTrainingJob"
|
|
}
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"data"
|
|
],
|
|
"title": "ListPostTrainingJobsResponse"
|
|
},
|
|
"DPOAlignmentConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"beta": {
|
|
"type": "number",
|
|
"description": "Temperature parameter for the DPO loss"
|
|
},
|
|
"loss_type": {
|
|
"$ref": "#/components/schemas/DPOLossType",
|
|
"default": "sigmoid",
|
|
"description": "The type of loss function to use for DPO"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"beta",
|
|
"loss_type"
|
|
],
|
|
"title": "DPOAlignmentConfig",
|
|
"description": "Configuration for Direct Preference Optimization (DPO) alignment."
|
|
},
|
|
"DPOLossType": {
|
|
"type": "string",
|
|
"enum": [
|
|
"sigmoid",
|
|
"hinge",
|
|
"ipo",
|
|
"kto_pair"
|
|
],
|
|
"title": "DPOLossType"
|
|
},
|
|
"DataConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"dataset_id": {
|
|
"type": "string",
|
|
"description": "Unique identifier for the training dataset"
|
|
},
|
|
"batch_size": {
|
|
"type": "integer",
|
|
"description": "Number of samples per training batch"
|
|
},
|
|
"shuffle": {
|
|
"type": "boolean",
|
|
"description": "Whether to shuffle the dataset during training"
|
|
},
|
|
"data_format": {
|
|
"$ref": "#/components/schemas/DatasetFormat",
|
|
"description": "Format of the dataset (instruct or dialog)"
|
|
},
|
|
"validation_dataset_id": {
|
|
"type": "string",
|
|
"description": "(Optional) Unique identifier for the validation dataset"
|
|
},
|
|
"packed": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to pack multiple samples into a single sequence for efficiency"
|
|
},
|
|
"train_on_input": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to compute loss on input tokens as well as output tokens"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"dataset_id",
|
|
"batch_size",
|
|
"shuffle",
|
|
"data_format"
|
|
],
|
|
"title": "DataConfig",
|
|
"description": "Configuration for training data and data loading."
|
|
},
|
|
"DatasetFormat": {
|
|
"type": "string",
|
|
"enum": [
|
|
"instruct",
|
|
"dialog"
|
|
],
|
|
"title": "DatasetFormat",
|
|
"description": "Format of the training dataset."
|
|
},
|
|
"EfficiencyConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"enable_activation_checkpointing": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to use activation checkpointing to reduce memory usage"
|
|
},
|
|
"enable_activation_offloading": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to offload activations to CPU to save GPU memory"
|
|
},
|
|
"memory_efficient_fsdp_wrap": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to use memory-efficient FSDP wrapping"
|
|
},
|
|
"fsdp_cpu_offload": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to offload FSDP parameters to CPU"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"title": "EfficiencyConfig",
|
|
"description": "Configuration for memory and compute efficiency optimizations."
|
|
},
|
|
"OptimizerConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"optimizer_type": {
|
|
"$ref": "#/components/schemas/OptimizerType",
|
|
"description": "Type of optimizer to use (adam, adamw, or sgd)"
|
|
},
|
|
"lr": {
|
|
"type": "number",
|
|
"description": "Learning rate for the optimizer"
|
|
},
|
|
"weight_decay": {
|
|
"type": "number",
|
|
"description": "Weight decay coefficient for regularization"
|
|
},
|
|
"num_warmup_steps": {
|
|
"type": "integer",
|
|
"description": "Number of steps for learning rate warmup"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"optimizer_type",
|
|
"lr",
|
|
"weight_decay",
|
|
"num_warmup_steps"
|
|
],
|
|
"title": "OptimizerConfig",
|
|
"description": "Configuration parameters for the optimization algorithm."
|
|
},
|
|
"OptimizerType": {
|
|
"type": "string",
|
|
"enum": [
|
|
"adam",
|
|
"adamw",
|
|
"sgd"
|
|
],
|
|
"title": "OptimizerType",
|
|
"description": "Available optimizer algorithms for training."
|
|
},
|
|
"TrainingConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"n_epochs": {
|
|
"type": "integer",
|
|
"description": "Number of training epochs to run"
|
|
},
|
|
"max_steps_per_epoch": {
|
|
"type": "integer",
|
|
"default": 1,
|
|
"description": "Maximum number of steps to run per epoch"
|
|
},
|
|
"gradient_accumulation_steps": {
|
|
"type": "integer",
|
|
"default": 1,
|
|
"description": "Number of steps to accumulate gradients before updating"
|
|
},
|
|
"max_validation_steps": {
|
|
"type": "integer",
|
|
"default": 1,
|
|
"description": "(Optional) Maximum number of validation steps per epoch"
|
|
},
|
|
"data_config": {
|
|
"$ref": "#/components/schemas/DataConfig",
|
|
"description": "(Optional) Configuration for data loading and formatting"
|
|
},
|
|
"optimizer_config": {
|
|
"$ref": "#/components/schemas/OptimizerConfig",
|
|
"description": "(Optional) Configuration for the optimization algorithm"
|
|
},
|
|
"efficiency_config": {
|
|
"$ref": "#/components/schemas/EfficiencyConfig",
|
|
"description": "(Optional) Configuration for memory and compute optimizations"
|
|
},
|
|
"dtype": {
|
|
"type": "string",
|
|
"default": "bf16",
|
|
"description": "(Optional) Data type for model parameters (bf16, fp16, fp32)"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"n_epochs",
|
|
"max_steps_per_epoch",
|
|
"gradient_accumulation_steps"
|
|
],
|
|
"title": "TrainingConfig",
|
|
"description": "Comprehensive configuration for the training process."
|
|
},
|
|
"PreferenceOptimizeRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string",
|
|
"description": "The UUID of the job to create."
|
|
},
|
|
"finetuned_model": {
|
|
"type": "string",
|
|
"description": "The model to fine-tune."
|
|
},
|
|
"algorithm_config": {
|
|
"$ref": "#/components/schemas/DPOAlignmentConfig",
|
|
"description": "The algorithm configuration."
|
|
},
|
|
"training_config": {
|
|
"$ref": "#/components/schemas/TrainingConfig",
|
|
"description": "The training configuration."
|
|
},
|
|
"hyperparam_search_config": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The hyperparam search configuration."
|
|
},
|
|
"logger_config": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The logger configuration."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid",
|
|
"finetuned_model",
|
|
"algorithm_config",
|
|
"training_config",
|
|
"hyperparam_search_config",
|
|
"logger_config"
|
|
],
|
|
"title": "PreferenceOptimizeRequest"
|
|
},
|
|
"PostTrainingJob": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid"
|
|
],
|
|
"title": "PostTrainingJob"
|
|
},
|
|
"AlgorithmConfig": {
|
|
"oneOf": [
|
|
{
|
|
"$ref": "#/components/schemas/LoraFinetuningConfig"
|
|
},
|
|
{
|
|
"$ref": "#/components/schemas/QATFinetuningConfig"
|
|
}
|
|
],
|
|
"discriminator": {
|
|
"propertyName": "type",
|
|
"mapping": {
|
|
"LoRA": "#/components/schemas/LoraFinetuningConfig",
|
|
"QAT": "#/components/schemas/QATFinetuningConfig"
|
|
}
|
|
}
|
|
},
|
|
"LoraFinetuningConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "LoRA",
|
|
"default": "LoRA",
|
|
"description": "Algorithm type identifier, always \"LoRA\""
|
|
},
|
|
"lora_attn_modules": {
|
|
"type": "array",
|
|
"items": {
|
|
"type": "string"
|
|
},
|
|
"description": "List of attention module names to apply LoRA to"
|
|
},
|
|
"apply_lora_to_mlp": {
|
|
"type": "boolean",
|
|
"description": "Whether to apply LoRA to MLP layers"
|
|
},
|
|
"apply_lora_to_output": {
|
|
"type": "boolean",
|
|
"description": "Whether to apply LoRA to output projection layers"
|
|
},
|
|
"rank": {
|
|
"type": "integer",
|
|
"description": "Rank of the LoRA adaptation (lower rank = fewer parameters)"
|
|
},
|
|
"alpha": {
|
|
"type": "integer",
|
|
"description": "LoRA scaling parameter that controls adaptation strength"
|
|
},
|
|
"use_dora": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to use DoRA (Weight-Decomposed Low-Rank Adaptation)"
|
|
},
|
|
"quantize_base": {
|
|
"type": "boolean",
|
|
"default": false,
|
|
"description": "(Optional) Whether to quantize the base model weights"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"lora_attn_modules",
|
|
"apply_lora_to_mlp",
|
|
"apply_lora_to_output",
|
|
"rank",
|
|
"alpha"
|
|
],
|
|
"title": "LoraFinetuningConfig",
|
|
"description": "Configuration for Low-Rank Adaptation (LoRA) fine-tuning."
|
|
},
|
|
"QATFinetuningConfig": {
|
|
"type": "object",
|
|
"properties": {
|
|
"type": {
|
|
"type": "string",
|
|
"const": "QAT",
|
|
"default": "QAT",
|
|
"description": "Algorithm type identifier, always \"QAT\""
|
|
},
|
|
"quantizer_name": {
|
|
"type": "string",
|
|
"description": "Name of the quantization algorithm to use"
|
|
},
|
|
"group_size": {
|
|
"type": "integer",
|
|
"description": "Size of groups for grouped quantization"
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"type",
|
|
"quantizer_name",
|
|
"group_size"
|
|
],
|
|
"title": "QATFinetuningConfig",
|
|
"description": "Configuration for Quantization-Aware Training (QAT) fine-tuning."
|
|
},
|
|
"SupervisedFineTuneRequest": {
|
|
"type": "object",
|
|
"properties": {
|
|
"job_uuid": {
|
|
"type": "string",
|
|
"description": "The UUID of the job to create."
|
|
},
|
|
"training_config": {
|
|
"$ref": "#/components/schemas/TrainingConfig",
|
|
"description": "The training configuration."
|
|
},
|
|
"hyperparam_search_config": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The hyperparam search configuration."
|
|
},
|
|
"logger_config": {
|
|
"type": "object",
|
|
"additionalProperties": {
|
|
"oneOf": [
|
|
{
|
|
"type": "null"
|
|
},
|
|
{
|
|
"type": "boolean"
|
|
},
|
|
{
|
|
"type": "number"
|
|
},
|
|
{
|
|
"type": "string"
|
|
},
|
|
{
|
|
"type": "array"
|
|
},
|
|
{
|
|
"type": "object"
|
|
}
|
|
]
|
|
},
|
|
"description": "The logger configuration."
|
|
},
|
|
"model": {
|
|
"type": "string",
|
|
"description": "The model to fine-tune."
|
|
},
|
|
"checkpoint_dir": {
|
|
"type": "string",
|
|
"description": "The directory to save checkpoint(s) to."
|
|
},
|
|
"algorithm_config": {
|
|
"$ref": "#/components/schemas/AlgorithmConfig",
|
|
"description": "The algorithm configuration."
|
|
}
|
|
},
|
|
"additionalProperties": false,
|
|
"required": [
|
|
"job_uuid",
|
|
"training_config",
|
|
"hyperparam_search_config",
|
|
"logger_config"
|
|
],
|
|
"title": "SupervisedFineTuneRequest"
|
|
}
|
|
},
|
|
"responses": {
|
|
"BadRequest400": {
|
|
"description": "The request was invalid or malformed",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Error"
|
|
},
|
|
"example": {
|
|
"status": 400,
|
|
"title": "Bad Request",
|
|
"detail": "The request was invalid or malformed"
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"TooManyRequests429": {
|
|
"description": "The client has sent too many requests in a given amount of time",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Error"
|
|
},
|
|
"example": {
|
|
"status": 429,
|
|
"title": "Too Many Requests",
|
|
"detail": "You have exceeded the rate limit. Please try again later."
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"InternalServerError500": {
|
|
"description": "The server encountered an unexpected error",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Error"
|
|
},
|
|
"example": {
|
|
"status": 500,
|
|
"title": "Internal Server Error",
|
|
"detail": "An unexpected error occurred. Our team has been notified."
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"DefaultError": {
|
|
"description": "An unexpected error occurred",
|
|
"content": {
|
|
"application/json": {
|
|
"schema": {
|
|
"$ref": "#/components/schemas/Error"
|
|
},
|
|
"example": {
|
|
"status": 0,
|
|
"title": "Error",
|
|
"detail": "An unexpected error occurred"
|
|
}
|
|
}
|
|
}
|
|
}
|
|
}
|
|
},
|
|
"security": [
|
|
{
|
|
"Default": []
|
|
}
|
|
],
|
|
"tags": [
|
|
{
|
|
"name": "Agents",
|
|
"description": "APIs for creating and interacting with agentic systems.\n\n## Agents API (Experimental)\n\n> **🧪 EXPERIMENTAL**: This API is in preview and may change based on user feedback. Great for exploring new capabilities and providing feedback to influence the final design.\n\nMain functionalities provided by this API:\n\n- Create agents with specific instructions and ability to use tools.\n- Interactions with agents are grouped into sessions (\"threads\"), and each interaction is called a \"turn\".\n- Agents can be provided with various tools (see the ToolGroups and ToolRuntime APIs for more details).\n- Agents can be provided with various shields (see the Safety API for more details).\n- Agents can also use Memory to retrieve information from knowledge bases. See the RAG Tool and Vector IO APIs for more details.\n\n### 🧪 Feedback Welcome\n\nThis API is actively being developed. We welcome feedback on:\n- API design and usability\n- Performance characteristics\n- Missing features or capabilities\n- Integration patterns\n\n**Provide Feedback**: [GitHub Discussions](https://github.com/llamastack/llama-stack/discussions) or [GitHub Issues](https://github.com/llamastack/llama-stack/issues)",
|
|
"x-displayName": "Agents"
|
|
},
|
|
{
|
|
"name": "Benchmarks",
|
|
"description": ""
|
|
},
|
|
{
|
|
"name": "DatasetIO",
|
|
"description": ""
|
|
},
|
|
{
|
|
"name": "Datasets",
|
|
"description": ""
|
|
},
|
|
{
|
|
"name": "Eval",
|
|
"description": "Llama Stack Evaluation API for running evaluations on model and agent candidates.",
|
|
"x-displayName": "Evaluations"
|
|
},
|
|
{
|
|
"name": "PostTraining (Coming Soon)",
|
|
"description": ""
|
|
}
|
|
],
|
|
"x-tagGroups": [
|
|
{
|
|
"name": "Operations",
|
|
"tags": [
|
|
"Agents",
|
|
"Benchmarks",
|
|
"DatasetIO",
|
|
"Datasets",
|
|
"Eval",
|
|
"PostTraining (Coming Soon)"
|
|
]
|
|
}
|
|
]
|
|
};
|
|
const element = document.getElementById("openapi-container");
|
|
element.apiDescriptionDocument = spec;
|
|
|
|
if (spec.info && spec.info.title) {
|
|
document.title = spec.info.title;
|
|
}
|
|
});
|
|
</script>
|
|
</body>
|
|
|
|
</html>
|