forked from phoenix-oss/llama-stack-mirror
# What does this PR do? Cleans up how we provide sampling params. Earlier, strategy was an enum and all params (top_p, temperature, top_k) across all strategies were grouped. We now have a strategy union object with each strategy (greedy, top_p, top_k) having its corresponding params. Earlier, ``` class SamplingParams: strategy: enum () top_p, temperature, top_k and other params ``` However, the `strategy` field was not being used in any providers making it confusing to know the exact sampling behavior purely based on the params since you could pass temperature, top_p, top_k and how the provider would interpret those would not be clear. Hence we introduced -- a union where the strategy and relevant params are all clubbed together to avoid this confusion. Have updated all providers, tests, notebooks, readme and otehr places where sampling params was being used to use the new format. ## Test Plan `pytest llama_stack/providers/tests/inference/groq/test_groq_utils.py` // inference on ollama, fireworks and together `with-proxy pytest -v -s -k "ollama" --inference-model="meta-llama/Llama-3.1-8B-Instruct" llama_stack/providers/tests/inference/test_text_inference.py ` // agents on fireworks `pytest -v -s -k 'fireworks and create_agent' --inference-model="meta-llama/Llama-3.1-8B-Instruct" llama_stack/providers/tests/agents/test_agents.py --safety-shield="meta-llama/Llama-Guard-3-8B"` ## Before submitting - [ ] This PR fixes a typo or improves the docs (you can dismiss the other checks if that's the case). - [X] Ran pre-commit to handle lint / formatting issues. - [X] Read the [contributor guideline](https://github.com/meta-llama/llama-stack/blob/main/CONTRIBUTING.md), Pull Request section? - [X] Updated relevant documentation. - [X] Wrote necessary unit or integration tests. --------- Co-authored-by: Hardik Shah <hjshah@fb.com>
6136 lines
166 KiB
YAML
6136 lines
166 KiB
YAML
components:
|
|
responses: {}
|
|
schemas:
|
|
AgentCandidate:
|
|
additionalProperties: false
|
|
properties:
|
|
config:
|
|
$ref: '#/components/schemas/AgentConfig'
|
|
type:
|
|
const: agent
|
|
default: agent
|
|
type: string
|
|
required:
|
|
- type
|
|
- config
|
|
type: object
|
|
AgentConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
client_tools:
|
|
items:
|
|
$ref: '#/components/schemas/ToolDef'
|
|
type: array
|
|
enable_session_persistence:
|
|
type: boolean
|
|
input_shields:
|
|
items:
|
|
type: string
|
|
type: array
|
|
instructions:
|
|
type: string
|
|
max_infer_iters:
|
|
default: 10
|
|
type: integer
|
|
model:
|
|
type: string
|
|
output_shields:
|
|
items:
|
|
type: string
|
|
type: array
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
tool_choice:
|
|
$ref: '#/components/schemas/ToolChoice'
|
|
default: auto
|
|
tool_prompt_format:
|
|
$ref: '#/components/schemas/ToolPromptFormat'
|
|
default: json
|
|
toolgroups:
|
|
items:
|
|
$ref: '#/components/schemas/AgentTool'
|
|
type: array
|
|
required:
|
|
- max_infer_iters
|
|
- model
|
|
- instructions
|
|
- enable_session_persistence
|
|
type: object
|
|
AgentCreateResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_id:
|
|
type: string
|
|
required:
|
|
- agent_id
|
|
type: object
|
|
AgentSessionCreateResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
session_id:
|
|
type: string
|
|
required:
|
|
- session_id
|
|
type: object
|
|
AgentStepResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
step:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/InferenceStep'
|
|
- $ref: '#/components/schemas/ToolExecutionStep'
|
|
- $ref: '#/components/schemas/ShieldCallStep'
|
|
- $ref: '#/components/schemas/MemoryRetrievalStep'
|
|
required:
|
|
- step
|
|
type: object
|
|
AgentTool:
|
|
oneOf:
|
|
- type: string
|
|
- additionalProperties: false
|
|
properties:
|
|
args:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
name:
|
|
type: string
|
|
required:
|
|
- name
|
|
- args
|
|
type: object
|
|
AgentTurnResponseEvent:
|
|
additionalProperties: false
|
|
properties:
|
|
payload:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/AgentTurnResponseStepStartPayload'
|
|
- $ref: '#/components/schemas/AgentTurnResponseStepProgressPayload'
|
|
- $ref: '#/components/schemas/AgentTurnResponseStepCompletePayload'
|
|
- $ref: '#/components/schemas/AgentTurnResponseTurnStartPayload'
|
|
- $ref: '#/components/schemas/AgentTurnResponseTurnCompletePayload'
|
|
required:
|
|
- payload
|
|
title: Streamed agent execution response.
|
|
type: object
|
|
AgentTurnResponseStepCompletePayload:
|
|
additionalProperties: false
|
|
properties:
|
|
event_type:
|
|
const: step_complete
|
|
default: step_complete
|
|
type: string
|
|
step_details:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/InferenceStep'
|
|
- $ref: '#/components/schemas/ToolExecutionStep'
|
|
- $ref: '#/components/schemas/ShieldCallStep'
|
|
- $ref: '#/components/schemas/MemoryRetrievalStep'
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
enum:
|
|
- inference
|
|
- tool_execution
|
|
- shield_call
|
|
- memory_retrieval
|
|
type: string
|
|
required:
|
|
- event_type
|
|
- step_type
|
|
- step_id
|
|
- step_details
|
|
type: object
|
|
AgentTurnResponseStepProgressPayload:
|
|
additionalProperties: false
|
|
properties:
|
|
delta:
|
|
$ref: '#/components/schemas/ContentDelta'
|
|
event_type:
|
|
const: step_progress
|
|
default: step_progress
|
|
type: string
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
enum:
|
|
- inference
|
|
- tool_execution
|
|
- shield_call
|
|
- memory_retrieval
|
|
type: string
|
|
required:
|
|
- event_type
|
|
- step_type
|
|
- step_id
|
|
- delta
|
|
type: object
|
|
AgentTurnResponseStepStartPayload:
|
|
additionalProperties: false
|
|
properties:
|
|
event_type:
|
|
const: step_start
|
|
default: step_start
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
enum:
|
|
- inference
|
|
- tool_execution
|
|
- shield_call
|
|
- memory_retrieval
|
|
type: string
|
|
required:
|
|
- event_type
|
|
- step_type
|
|
- step_id
|
|
type: object
|
|
AgentTurnResponseStreamChunk:
|
|
additionalProperties: false
|
|
properties:
|
|
event:
|
|
$ref: '#/components/schemas/AgentTurnResponseEvent'
|
|
required:
|
|
- event
|
|
title: streamed agent turn completion response.
|
|
type: object
|
|
AgentTurnResponseTurnCompletePayload:
|
|
additionalProperties: false
|
|
properties:
|
|
event_type:
|
|
const: turn_complete
|
|
default: turn_complete
|
|
type: string
|
|
turn:
|
|
$ref: '#/components/schemas/Turn'
|
|
required:
|
|
- event_type
|
|
- turn
|
|
type: object
|
|
AgentTurnResponseTurnStartPayload:
|
|
additionalProperties: false
|
|
properties:
|
|
event_type:
|
|
const: turn_start
|
|
default: turn_start
|
|
type: string
|
|
turn_id:
|
|
type: string
|
|
required:
|
|
- event_type
|
|
- turn_id
|
|
type: object
|
|
AggregationFunctionType:
|
|
enum:
|
|
- average
|
|
- median
|
|
- categorical_count
|
|
- accuracy
|
|
type: string
|
|
AppEvalTaskConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
eval_candidate:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/ModelCandidate'
|
|
- $ref: '#/components/schemas/AgentCandidate'
|
|
num_examples:
|
|
type: integer
|
|
scoring_params:
|
|
additionalProperties:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
|
|
- $ref: '#/components/schemas/RegexParserScoringFnParams'
|
|
- $ref: '#/components/schemas/BasicScoringFnParams'
|
|
type: object
|
|
type:
|
|
const: app
|
|
default: app
|
|
type: string
|
|
required:
|
|
- type
|
|
- eval_candidate
|
|
- scoring_params
|
|
type: object
|
|
AppendRowsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
rows:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
required:
|
|
- dataset_id
|
|
- rows
|
|
type: object
|
|
BasicScoringFnParams:
|
|
additionalProperties: false
|
|
properties:
|
|
aggregation_functions:
|
|
items:
|
|
$ref: '#/components/schemas/AggregationFunctionType'
|
|
type: array
|
|
type:
|
|
const: basic
|
|
default: basic
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
BatchChatCompletionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
logprobs:
|
|
additionalProperties: false
|
|
properties:
|
|
top_k:
|
|
default: 0
|
|
type: integer
|
|
type: object
|
|
messages_batch:
|
|
items:
|
|
items:
|
|
$ref: '#/components/schemas/Message'
|
|
type: array
|
|
type: array
|
|
model:
|
|
type: string
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
tool_choice:
|
|
$ref: '#/components/schemas/ToolChoice'
|
|
tool_prompt_format:
|
|
$ref: '#/components/schemas/ToolPromptFormat'
|
|
tools:
|
|
items:
|
|
$ref: '#/components/schemas/ToolDefinition'
|
|
type: array
|
|
required:
|
|
- model
|
|
- messages_batch
|
|
type: object
|
|
BatchChatCompletionResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
completion_message_batch:
|
|
items:
|
|
$ref: '#/components/schemas/CompletionMessage'
|
|
type: array
|
|
required:
|
|
- completion_message_batch
|
|
type: object
|
|
BatchCompletionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
content_batch:
|
|
items:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
type: array
|
|
logprobs:
|
|
additionalProperties: false
|
|
properties:
|
|
top_k:
|
|
default: 0
|
|
type: integer
|
|
type: object
|
|
model:
|
|
type: string
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
required:
|
|
- model
|
|
- content_batch
|
|
type: object
|
|
BatchCompletionResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
completion_message_batch:
|
|
items:
|
|
$ref: '#/components/schemas/CompletionMessage'
|
|
type: array
|
|
required:
|
|
- completion_message_batch
|
|
type: object
|
|
BenchmarkEvalTaskConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
eval_candidate:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/ModelCandidate'
|
|
- $ref: '#/components/schemas/AgentCandidate'
|
|
num_examples:
|
|
type: integer
|
|
type:
|
|
const: benchmark
|
|
default: benchmark
|
|
type: string
|
|
required:
|
|
- type
|
|
- eval_candidate
|
|
type: object
|
|
BuiltinTool:
|
|
enum:
|
|
- brave_search
|
|
- wolfram_alpha
|
|
- photogen
|
|
- code_interpreter
|
|
type: string
|
|
CancelTrainingJobRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
job_uuid:
|
|
type: string
|
|
required:
|
|
- job_uuid
|
|
type: object
|
|
ChatCompletionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
logprobs:
|
|
additionalProperties: false
|
|
properties:
|
|
top_k:
|
|
default: 0
|
|
type: integer
|
|
type: object
|
|
messages:
|
|
items:
|
|
$ref: '#/components/schemas/Message'
|
|
type: array
|
|
model_id:
|
|
type: string
|
|
response_format:
|
|
$ref: '#/components/schemas/ResponseFormat'
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
stream:
|
|
type: boolean
|
|
tool_choice:
|
|
$ref: '#/components/schemas/ToolChoice'
|
|
tool_prompt_format:
|
|
$ref: '#/components/schemas/ToolPromptFormat'
|
|
tools:
|
|
items:
|
|
$ref: '#/components/schemas/ToolDefinition'
|
|
type: array
|
|
required:
|
|
- model_id
|
|
- messages
|
|
type: object
|
|
ChatCompletionResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
completion_message:
|
|
$ref: '#/components/schemas/CompletionMessage'
|
|
logprobs:
|
|
items:
|
|
$ref: '#/components/schemas/TokenLogProbs'
|
|
type: array
|
|
required:
|
|
- completion_message
|
|
title: Chat completion response.
|
|
type: object
|
|
ChatCompletionResponseEvent:
|
|
additionalProperties: false
|
|
properties:
|
|
delta:
|
|
$ref: '#/components/schemas/ContentDelta'
|
|
event_type:
|
|
$ref: '#/components/schemas/ChatCompletionResponseEventType'
|
|
logprobs:
|
|
items:
|
|
$ref: '#/components/schemas/TokenLogProbs'
|
|
type: array
|
|
stop_reason:
|
|
$ref: '#/components/schemas/StopReason'
|
|
required:
|
|
- event_type
|
|
- delta
|
|
title: Chat completion response event.
|
|
type: object
|
|
ChatCompletionResponseEventType:
|
|
enum:
|
|
- start
|
|
- complete
|
|
- progress
|
|
type: string
|
|
ChatCompletionResponseStreamChunk:
|
|
additionalProperties: false
|
|
properties:
|
|
event:
|
|
$ref: '#/components/schemas/ChatCompletionResponseEvent'
|
|
required:
|
|
- event
|
|
title: SSE-stream of these events.
|
|
type: object
|
|
Checkpoint:
|
|
description: Checkpoint created during training runs
|
|
CompletionMessage:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
role:
|
|
const: assistant
|
|
default: assistant
|
|
type: string
|
|
stop_reason:
|
|
$ref: '#/components/schemas/StopReason'
|
|
tool_calls:
|
|
items:
|
|
$ref: '#/components/schemas/ToolCall'
|
|
type: array
|
|
required:
|
|
- role
|
|
- content
|
|
- stop_reason
|
|
- tool_calls
|
|
type: object
|
|
CompletionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
logprobs:
|
|
additionalProperties: false
|
|
properties:
|
|
top_k:
|
|
default: 0
|
|
type: integer
|
|
type: object
|
|
model_id:
|
|
type: string
|
|
response_format:
|
|
$ref: '#/components/schemas/ResponseFormat'
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
stream:
|
|
type: boolean
|
|
required:
|
|
- model_id
|
|
- content
|
|
type: object
|
|
CompletionResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
type: string
|
|
logprobs:
|
|
items:
|
|
$ref: '#/components/schemas/TokenLogProbs'
|
|
type: array
|
|
stop_reason:
|
|
$ref: '#/components/schemas/StopReason'
|
|
required:
|
|
- content
|
|
- stop_reason
|
|
title: Completion response.
|
|
type: object
|
|
CompletionResponseStreamChunk:
|
|
additionalProperties: false
|
|
properties:
|
|
delta:
|
|
type: string
|
|
logprobs:
|
|
items:
|
|
$ref: '#/components/schemas/TokenLogProbs'
|
|
type: array
|
|
stop_reason:
|
|
$ref: '#/components/schemas/StopReason'
|
|
required:
|
|
- delta
|
|
title: streamed completion response.
|
|
type: object
|
|
ContentDelta:
|
|
oneOf:
|
|
- additionalProperties: false
|
|
properties:
|
|
text:
|
|
type: string
|
|
type:
|
|
const: text
|
|
default: text
|
|
type: string
|
|
required:
|
|
- type
|
|
- text
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
data:
|
|
contentEncoding: base64
|
|
type: string
|
|
type:
|
|
const: image
|
|
default: image
|
|
type: string
|
|
required:
|
|
- type
|
|
- data
|
|
type: object
|
|
- $ref: '#/components/schemas/ToolCallDelta'
|
|
CreateAgentRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_config:
|
|
$ref: '#/components/schemas/AgentConfig'
|
|
required:
|
|
- agent_config
|
|
type: object
|
|
CreateAgentSessionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_id:
|
|
type: string
|
|
session_name:
|
|
type: string
|
|
required:
|
|
- agent_id
|
|
- session_name
|
|
type: object
|
|
CreateAgentTurnRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_id:
|
|
type: string
|
|
documents:
|
|
items:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
oneOf:
|
|
- type: string
|
|
- $ref: '#/components/schemas/InterleavedContentItem'
|
|
- items:
|
|
$ref: '#/components/schemas/InterleavedContentItem'
|
|
type: array
|
|
- $ref: '#/components/schemas/URL'
|
|
mime_type:
|
|
type: string
|
|
required:
|
|
- content
|
|
- mime_type
|
|
type: object
|
|
type: array
|
|
messages:
|
|
items:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/UserMessage'
|
|
- $ref: '#/components/schemas/ToolResponseMessage'
|
|
type: array
|
|
session_id:
|
|
type: string
|
|
stream:
|
|
type: boolean
|
|
toolgroups:
|
|
items:
|
|
$ref: '#/components/schemas/AgentTool'
|
|
type: array
|
|
required:
|
|
- agent_id
|
|
- session_id
|
|
- messages
|
|
type: object
|
|
DPOAlignmentConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
epsilon:
|
|
type: number
|
|
gamma:
|
|
type: number
|
|
reward_clip:
|
|
type: number
|
|
reward_scale:
|
|
type: number
|
|
required:
|
|
- reward_scale
|
|
- reward_clip
|
|
- epsilon
|
|
- gamma
|
|
type: object
|
|
DataConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
batch_size:
|
|
type: integer
|
|
dataset_id:
|
|
type: string
|
|
packed:
|
|
default: false
|
|
type: boolean
|
|
shuffle:
|
|
type: boolean
|
|
train_on_input:
|
|
default: false
|
|
type: boolean
|
|
validation_dataset_id:
|
|
type: string
|
|
required:
|
|
- dataset_id
|
|
- batch_size
|
|
- shuffle
|
|
type: object
|
|
Dataset:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_schema:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ParamType'
|
|
type: object
|
|
identifier:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: dataset
|
|
default: dataset
|
|
type: string
|
|
url:
|
|
$ref: '#/components/schemas/URL'
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- dataset_schema
|
|
- url
|
|
- metadata
|
|
type: object
|
|
DeleteAgentsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_id:
|
|
type: string
|
|
required:
|
|
- agent_id
|
|
type: object
|
|
DeleteAgentsSessionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
agent_id:
|
|
type: string
|
|
session_id:
|
|
type: string
|
|
required:
|
|
- agent_id
|
|
- session_id
|
|
type: object
|
|
EfficiencyConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
enable_activation_checkpointing:
|
|
default: false
|
|
type: boolean
|
|
enable_activation_offloading:
|
|
default: false
|
|
type: boolean
|
|
fsdp_cpu_offload:
|
|
default: false
|
|
type: boolean
|
|
memory_efficient_fsdp_wrap:
|
|
default: false
|
|
type: boolean
|
|
type: object
|
|
EmbeddingsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
contents:
|
|
items:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
type: array
|
|
model_id:
|
|
type: string
|
|
required:
|
|
- model_id
|
|
- contents
|
|
type: object
|
|
EmbeddingsResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
embeddings:
|
|
items:
|
|
items:
|
|
type: number
|
|
type: array
|
|
type: array
|
|
required:
|
|
- embeddings
|
|
type: object
|
|
EvalTask:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
identifier:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
scoring_functions:
|
|
items:
|
|
type: string
|
|
type: array
|
|
type:
|
|
const: eval_task
|
|
default: eval_task
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- dataset_id
|
|
- scoring_functions
|
|
- metadata
|
|
type: object
|
|
EvaluateResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
generations:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
scores:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ScoringResult'
|
|
type: object
|
|
required:
|
|
- generations
|
|
- scores
|
|
type: object
|
|
EvaluateRowsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
input_rows:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
scoring_functions:
|
|
items:
|
|
type: string
|
|
type: array
|
|
task_config:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BenchmarkEvalTaskConfig'
|
|
- $ref: '#/components/schemas/AppEvalTaskConfig'
|
|
task_id:
|
|
type: string
|
|
required:
|
|
- task_id
|
|
- input_rows
|
|
- scoring_functions
|
|
- task_config
|
|
type: object
|
|
GetAgentsSessionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
turn_ids:
|
|
items:
|
|
type: string
|
|
type: array
|
|
type: object
|
|
GetSpanTreeRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes_to_return:
|
|
items:
|
|
type: string
|
|
type: array
|
|
type: object
|
|
GraphMemoryBank:
|
|
additionalProperties: false
|
|
properties:
|
|
identifier:
|
|
type: string
|
|
memory_bank_type:
|
|
const: graph
|
|
default: graph
|
|
type: string
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: memory_bank
|
|
default: memory_bank
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- memory_bank_type
|
|
type: object
|
|
GraphMemoryBankParams:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank_type:
|
|
const: graph
|
|
default: graph
|
|
type: string
|
|
required:
|
|
- memory_bank_type
|
|
type: object
|
|
GreedySamplingStrategy:
|
|
additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: greedy
|
|
default: greedy
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
HealthInfo:
|
|
additionalProperties: false
|
|
properties:
|
|
status:
|
|
type: string
|
|
required:
|
|
- status
|
|
type: object
|
|
ImageContentItem:
|
|
additionalProperties: false
|
|
properties:
|
|
data:
|
|
contentEncoding: base64
|
|
type: string
|
|
type:
|
|
const: image
|
|
default: image
|
|
type: string
|
|
url:
|
|
$ref: '#/components/schemas/URL'
|
|
required:
|
|
- type
|
|
type: object
|
|
InferenceStep:
|
|
additionalProperties: false
|
|
properties:
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
model_response:
|
|
$ref: '#/components/schemas/CompletionMessage'
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
const: inference
|
|
default: inference
|
|
type: string
|
|
turn_id:
|
|
type: string
|
|
required:
|
|
- turn_id
|
|
- step_id
|
|
- step_type
|
|
- model_response
|
|
type: object
|
|
InsertDocumentsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
bank_id:
|
|
type: string
|
|
documents:
|
|
items:
|
|
$ref: '#/components/schemas/MemoryBankDocument'
|
|
type: array
|
|
ttl_seconds:
|
|
type: integer
|
|
required:
|
|
- bank_id
|
|
- documents
|
|
type: object
|
|
InterleavedContent:
|
|
oneOf:
|
|
- type: string
|
|
- $ref: '#/components/schemas/InterleavedContentItem'
|
|
- items:
|
|
$ref: '#/components/schemas/InterleavedContentItem'
|
|
type: array
|
|
InterleavedContentItem:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/ImageContentItem'
|
|
- $ref: '#/components/schemas/TextContentItem'
|
|
InvokeToolRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
args:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
tool_name:
|
|
type: string
|
|
required:
|
|
- tool_name
|
|
- args
|
|
type: object
|
|
Job:
|
|
additionalProperties: false
|
|
properties:
|
|
job_id:
|
|
type: string
|
|
required:
|
|
- job_id
|
|
type: object
|
|
JobCancelRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
job_id:
|
|
type: string
|
|
task_id:
|
|
type: string
|
|
required:
|
|
- task_id
|
|
- job_id
|
|
type: object
|
|
JobStatus:
|
|
enum:
|
|
- completed
|
|
- in_progress
|
|
- failed
|
|
- scheduled
|
|
type: string
|
|
KeyValueMemoryBank:
|
|
additionalProperties: false
|
|
properties:
|
|
identifier:
|
|
type: string
|
|
memory_bank_type:
|
|
const: keyvalue
|
|
default: keyvalue
|
|
type: string
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: memory_bank
|
|
default: memory_bank
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- memory_bank_type
|
|
type: object
|
|
KeyValueMemoryBankParams:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank_type:
|
|
const: keyvalue
|
|
default: keyvalue
|
|
type: string
|
|
required:
|
|
- memory_bank_type
|
|
type: object
|
|
KeywordMemoryBank:
|
|
additionalProperties: false
|
|
properties:
|
|
identifier:
|
|
type: string
|
|
memory_bank_type:
|
|
const: keyword
|
|
default: keyword
|
|
type: string
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: memory_bank
|
|
default: memory_bank
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- memory_bank_type
|
|
type: object
|
|
KeywordMemoryBankParams:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank_type:
|
|
const: keyword
|
|
default: keyword
|
|
type: string
|
|
required:
|
|
- memory_bank_type
|
|
type: object
|
|
LLMAsJudgeScoringFnParams:
|
|
additionalProperties: false
|
|
properties:
|
|
aggregation_functions:
|
|
items:
|
|
$ref: '#/components/schemas/AggregationFunctionType'
|
|
type: array
|
|
judge_model:
|
|
type: string
|
|
judge_score_regexes:
|
|
items:
|
|
type: string
|
|
type: array
|
|
prompt_template:
|
|
type: string
|
|
type:
|
|
const: llm_as_judge
|
|
default: llm_as_judge
|
|
type: string
|
|
required:
|
|
- type
|
|
- judge_model
|
|
type: object
|
|
ListRuntimeToolsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
mcp_endpoint:
|
|
$ref: '#/components/schemas/URL'
|
|
type: object
|
|
LogEventRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
event:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/UnstructuredLogEvent'
|
|
- $ref: '#/components/schemas/MetricEvent'
|
|
- $ref: '#/components/schemas/StructuredLogEvent'
|
|
ttl_seconds:
|
|
type: integer
|
|
required:
|
|
- event
|
|
- ttl_seconds
|
|
type: object
|
|
LogSeverity:
|
|
enum:
|
|
- verbose
|
|
- debug
|
|
- info
|
|
- warn
|
|
- error
|
|
- critical
|
|
type: string
|
|
LoraFinetuningConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
alpha:
|
|
type: integer
|
|
apply_lora_to_mlp:
|
|
type: boolean
|
|
apply_lora_to_output:
|
|
type: boolean
|
|
lora_attn_modules:
|
|
items:
|
|
type: string
|
|
type: array
|
|
quantize_base:
|
|
default: false
|
|
type: boolean
|
|
rank:
|
|
type: integer
|
|
type:
|
|
const: LoRA
|
|
default: LoRA
|
|
type: string
|
|
use_dora:
|
|
default: false
|
|
type: boolean
|
|
required:
|
|
- type
|
|
- lora_attn_modules
|
|
- apply_lora_to_mlp
|
|
- apply_lora_to_output
|
|
- rank
|
|
- alpha
|
|
type: object
|
|
MemoryBankDocument:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
oneOf:
|
|
- type: string
|
|
- $ref: '#/components/schemas/InterleavedContentItem'
|
|
- items:
|
|
$ref: '#/components/schemas/InterleavedContentItem'
|
|
type: array
|
|
- $ref: '#/components/schemas/URL'
|
|
document_id:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
mime_type:
|
|
type: string
|
|
required:
|
|
- document_id
|
|
- content
|
|
- metadata
|
|
type: object
|
|
MemoryRetrievalStep:
|
|
additionalProperties: false
|
|
properties:
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
inserted_context:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
memory_bank_ids:
|
|
items:
|
|
type: string
|
|
type: array
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
const: memory_retrieval
|
|
default: memory_retrieval
|
|
type: string
|
|
turn_id:
|
|
type: string
|
|
required:
|
|
- turn_id
|
|
- step_id
|
|
- step_type
|
|
- memory_bank_ids
|
|
- inserted_context
|
|
type: object
|
|
Message:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/UserMessage'
|
|
- $ref: '#/components/schemas/SystemMessage'
|
|
- $ref: '#/components/schemas/ToolResponseMessage'
|
|
- $ref: '#/components/schemas/CompletionMessage'
|
|
MetricEvent:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
metric:
|
|
type: string
|
|
span_id:
|
|
type: string
|
|
timestamp:
|
|
format: date-time
|
|
type: string
|
|
trace_id:
|
|
type: string
|
|
type:
|
|
const: metric
|
|
default: metric
|
|
type: string
|
|
unit:
|
|
type: string
|
|
value:
|
|
oneOf:
|
|
- type: integer
|
|
- type: number
|
|
required:
|
|
- trace_id
|
|
- span_id
|
|
- timestamp
|
|
- type
|
|
- metric
|
|
- value
|
|
- unit
|
|
type: object
|
|
Model:
|
|
additionalProperties: false
|
|
properties:
|
|
identifier:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
model_type:
|
|
$ref: '#/components/schemas/ModelType'
|
|
default: llm
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: model
|
|
default: model
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- metadata
|
|
- model_type
|
|
type: object
|
|
ModelCandidate:
|
|
additionalProperties: false
|
|
properties:
|
|
model:
|
|
type: string
|
|
sampling_params:
|
|
$ref: '#/components/schemas/SamplingParams'
|
|
system_message:
|
|
$ref: '#/components/schemas/SystemMessage'
|
|
type:
|
|
const: model
|
|
default: model
|
|
type: string
|
|
required:
|
|
- type
|
|
- model
|
|
- sampling_params
|
|
type: object
|
|
ModelType:
|
|
enum:
|
|
- llm
|
|
- embedding
|
|
type: string
|
|
OptimizerConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
lr:
|
|
type: number
|
|
num_warmup_steps:
|
|
type: integer
|
|
optimizer_type:
|
|
$ref: '#/components/schemas/OptimizerType'
|
|
weight_decay:
|
|
type: number
|
|
required:
|
|
- optimizer_type
|
|
- lr
|
|
- weight_decay
|
|
- num_warmup_steps
|
|
type: object
|
|
OptimizerType:
|
|
enum:
|
|
- adam
|
|
- adamw
|
|
- sgd
|
|
type: string
|
|
PaginatedRowsResult:
|
|
additionalProperties: false
|
|
properties:
|
|
next_page_token:
|
|
type: string
|
|
rows:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
total_count:
|
|
type: integer
|
|
required:
|
|
- rows
|
|
- total_count
|
|
type: object
|
|
ParamType:
|
|
oneOf:
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: string
|
|
default: string
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: number
|
|
default: number
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: boolean
|
|
default: boolean
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: array
|
|
default: array
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: object
|
|
default: object
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: json
|
|
default: json
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: union
|
|
default: union
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: chat_completion_input
|
|
default: chat_completion_input
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: completion_input
|
|
default: completion_input
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
type:
|
|
const: agent_turn_input
|
|
default: agent_turn_input
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
PostTrainingJob:
|
|
additionalProperties: false
|
|
properties:
|
|
job_uuid:
|
|
type: string
|
|
required:
|
|
- job_uuid
|
|
type: object
|
|
PostTrainingJobArtifactsResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
checkpoints:
|
|
items:
|
|
$ref: '#/components/schemas/Checkpoint'
|
|
type: array
|
|
job_uuid:
|
|
type: string
|
|
required:
|
|
- job_uuid
|
|
- checkpoints
|
|
title: Artifacts of a finetuning job.
|
|
type: object
|
|
PostTrainingJobStatusResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
checkpoints:
|
|
items:
|
|
$ref: '#/components/schemas/Checkpoint'
|
|
type: array
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
job_uuid:
|
|
type: string
|
|
resources_allocated:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
scheduled_at:
|
|
format: date-time
|
|
type: string
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
status:
|
|
$ref: '#/components/schemas/JobStatus'
|
|
required:
|
|
- job_uuid
|
|
- status
|
|
- checkpoints
|
|
title: Status of a finetuning job.
|
|
type: object
|
|
PreferenceOptimizeRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
algorithm_config:
|
|
$ref: '#/components/schemas/DPOAlignmentConfig'
|
|
finetuned_model:
|
|
type: string
|
|
hyperparam_search_config:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
job_uuid:
|
|
type: string
|
|
logger_config:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
training_config:
|
|
$ref: '#/components/schemas/TrainingConfig'
|
|
required:
|
|
- job_uuid
|
|
- finetuned_model
|
|
- algorithm_config
|
|
- training_config
|
|
- hyperparam_search_config
|
|
- logger_config
|
|
type: object
|
|
ProviderInfo:
|
|
additionalProperties: false
|
|
properties:
|
|
provider_id:
|
|
type: string
|
|
provider_type:
|
|
type: string
|
|
required:
|
|
- provider_id
|
|
- provider_type
|
|
type: object
|
|
QATFinetuningConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
group_size:
|
|
type: integer
|
|
quantizer_name:
|
|
type: string
|
|
type:
|
|
const: QAT
|
|
default: QAT
|
|
type: string
|
|
required:
|
|
- type
|
|
- quantizer_name
|
|
- group_size
|
|
type: object
|
|
QueryCondition:
|
|
additionalProperties: false
|
|
properties:
|
|
key:
|
|
type: string
|
|
op:
|
|
$ref: '#/components/schemas/QueryConditionOp'
|
|
value:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
required:
|
|
- key
|
|
- op
|
|
- value
|
|
type: object
|
|
QueryConditionOp:
|
|
enum:
|
|
- eq
|
|
- ne
|
|
- gt
|
|
- lt
|
|
type: string
|
|
QueryDocumentsRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
bank_id:
|
|
type: string
|
|
params:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
query:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
required:
|
|
- bank_id
|
|
- query
|
|
type: object
|
|
QueryDocumentsResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
chunks:
|
|
items:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
document_id:
|
|
type: string
|
|
token_count:
|
|
type: integer
|
|
required:
|
|
- content
|
|
- token_count
|
|
- document_id
|
|
type: object
|
|
type: array
|
|
scores:
|
|
items:
|
|
type: number
|
|
type: array
|
|
required:
|
|
- chunks
|
|
- scores
|
|
type: object
|
|
QuerySpansRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
attribute_filters:
|
|
items:
|
|
$ref: '#/components/schemas/QueryCondition'
|
|
type: array
|
|
attributes_to_return:
|
|
items:
|
|
type: string
|
|
type: array
|
|
max_depth:
|
|
type: integer
|
|
required:
|
|
- attribute_filters
|
|
- attributes_to_return
|
|
type: object
|
|
QueryTracesRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
attribute_filters:
|
|
items:
|
|
$ref: '#/components/schemas/QueryCondition'
|
|
type: array
|
|
limit:
|
|
type: integer
|
|
offset:
|
|
type: integer
|
|
order_by:
|
|
items:
|
|
type: string
|
|
type: array
|
|
type: object
|
|
RegexParserScoringFnParams:
|
|
additionalProperties: false
|
|
properties:
|
|
aggregation_functions:
|
|
items:
|
|
$ref: '#/components/schemas/AggregationFunctionType'
|
|
type: array
|
|
parsing_regexes:
|
|
items:
|
|
type: string
|
|
type: array
|
|
type:
|
|
const: regex_parser
|
|
default: regex_parser
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
RegisterDatasetRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
dataset_schema:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ParamType'
|
|
type: object
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_dataset_id:
|
|
type: string
|
|
provider_id:
|
|
type: string
|
|
url:
|
|
$ref: '#/components/schemas/URL'
|
|
required:
|
|
- dataset_id
|
|
- dataset_schema
|
|
- url
|
|
type: object
|
|
RegisterEvalTaskRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
eval_task_id:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_eval_task_id:
|
|
type: string
|
|
provider_id:
|
|
type: string
|
|
scoring_functions:
|
|
items:
|
|
type: string
|
|
type: array
|
|
required:
|
|
- eval_task_id
|
|
- dataset_id
|
|
- scoring_functions
|
|
type: object
|
|
RegisterMemoryBankRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank_id:
|
|
type: string
|
|
params:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/VectorMemoryBankParams'
|
|
- $ref: '#/components/schemas/KeyValueMemoryBankParams'
|
|
- $ref: '#/components/schemas/KeywordMemoryBankParams'
|
|
- $ref: '#/components/schemas/GraphMemoryBankParams'
|
|
provider_id:
|
|
type: string
|
|
provider_memory_bank_id:
|
|
type: string
|
|
required:
|
|
- memory_bank_id
|
|
- params
|
|
type: object
|
|
RegisterModelRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
model_id:
|
|
type: string
|
|
model_type:
|
|
$ref: '#/components/schemas/ModelType'
|
|
provider_id:
|
|
type: string
|
|
provider_model_id:
|
|
type: string
|
|
required:
|
|
- model_id
|
|
type: object
|
|
RegisterScoringFunctionRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
description:
|
|
type: string
|
|
params:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
|
|
- $ref: '#/components/schemas/RegexParserScoringFnParams'
|
|
- $ref: '#/components/schemas/BasicScoringFnParams'
|
|
provider_id:
|
|
type: string
|
|
provider_scoring_fn_id:
|
|
type: string
|
|
return_type:
|
|
$ref: '#/components/schemas/ParamType'
|
|
scoring_fn_id:
|
|
type: string
|
|
required:
|
|
- scoring_fn_id
|
|
- description
|
|
- return_type
|
|
type: object
|
|
RegisterShieldRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
params:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_id:
|
|
type: string
|
|
provider_shield_id:
|
|
type: string
|
|
shield_id:
|
|
type: string
|
|
required:
|
|
- shield_id
|
|
type: object
|
|
RegisterToolGroupRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
args:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
mcp_endpoint:
|
|
$ref: '#/components/schemas/URL'
|
|
provider_id:
|
|
type: string
|
|
toolgroup_id:
|
|
type: string
|
|
required:
|
|
- toolgroup_id
|
|
- provider_id
|
|
type: object
|
|
ResponseFormat:
|
|
oneOf:
|
|
- additionalProperties: false
|
|
properties:
|
|
json_schema:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type:
|
|
const: json_schema
|
|
default: json_schema
|
|
type: string
|
|
required:
|
|
- type
|
|
- json_schema
|
|
type: object
|
|
- additionalProperties: false
|
|
properties:
|
|
bnf:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type:
|
|
const: grammar
|
|
default: grammar
|
|
type: string
|
|
required:
|
|
- type
|
|
- bnf
|
|
type: object
|
|
RouteInfo:
|
|
additionalProperties: false
|
|
properties:
|
|
method:
|
|
type: string
|
|
provider_types:
|
|
items:
|
|
type: string
|
|
type: array
|
|
route:
|
|
type: string
|
|
required:
|
|
- route
|
|
- method
|
|
- provider_types
|
|
type: object
|
|
RunEvalRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
task_config:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BenchmarkEvalTaskConfig'
|
|
- $ref: '#/components/schemas/AppEvalTaskConfig'
|
|
task_id:
|
|
type: string
|
|
required:
|
|
- task_id
|
|
- task_config
|
|
type: object
|
|
RunShieldRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
messages:
|
|
items:
|
|
$ref: '#/components/schemas/Message'
|
|
type: array
|
|
params:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
shield_id:
|
|
type: string
|
|
required:
|
|
- shield_id
|
|
- messages
|
|
- params
|
|
type: object
|
|
RunShieldResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
violation:
|
|
$ref: '#/components/schemas/SafetyViolation'
|
|
type: object
|
|
SafetyViolation:
|
|
additionalProperties: false
|
|
properties:
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
user_message:
|
|
type: string
|
|
violation_level:
|
|
$ref: '#/components/schemas/ViolationLevel'
|
|
required:
|
|
- violation_level
|
|
- metadata
|
|
type: object
|
|
SamplingParams:
|
|
additionalProperties: false
|
|
properties:
|
|
max_tokens:
|
|
default: 0
|
|
type: integer
|
|
repetition_penalty:
|
|
default: 1.0
|
|
type: number
|
|
strategy:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/GreedySamplingStrategy'
|
|
- $ref: '#/components/schemas/TopPSamplingStrategy'
|
|
- $ref: '#/components/schemas/TopKSamplingStrategy'
|
|
required:
|
|
- strategy
|
|
type: object
|
|
SaveSpansToDatasetRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
attribute_filters:
|
|
items:
|
|
$ref: '#/components/schemas/QueryCondition'
|
|
type: array
|
|
attributes_to_save:
|
|
items:
|
|
type: string
|
|
type: array
|
|
dataset_id:
|
|
type: string
|
|
max_depth:
|
|
type: integer
|
|
required:
|
|
- attribute_filters
|
|
- attributes_to_save
|
|
- dataset_id
|
|
type: object
|
|
ScoreBatchRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
save_results_dataset:
|
|
type: boolean
|
|
scoring_functions:
|
|
additionalProperties:
|
|
oneOf:
|
|
- oneOf:
|
|
- $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
|
|
- $ref: '#/components/schemas/RegexParserScoringFnParams'
|
|
- $ref: '#/components/schemas/BasicScoringFnParams'
|
|
- type: 'null'
|
|
type: object
|
|
required:
|
|
- dataset_id
|
|
- scoring_functions
|
|
- save_results_dataset
|
|
type: object
|
|
ScoreBatchResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
results:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ScoringResult'
|
|
type: object
|
|
required:
|
|
- results
|
|
type: object
|
|
ScoreRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
input_rows:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
scoring_functions:
|
|
additionalProperties:
|
|
oneOf:
|
|
- oneOf:
|
|
- $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
|
|
- $ref: '#/components/schemas/RegexParserScoringFnParams'
|
|
- $ref: '#/components/schemas/BasicScoringFnParams'
|
|
- type: 'null'
|
|
type: object
|
|
required:
|
|
- input_rows
|
|
- scoring_functions
|
|
type: object
|
|
ScoreResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
results:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ScoringResult'
|
|
type: object
|
|
required:
|
|
- results
|
|
type: object
|
|
ScoringFn:
|
|
additionalProperties: false
|
|
properties:
|
|
description:
|
|
type: string
|
|
identifier:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
params:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/LLMAsJudgeScoringFnParams'
|
|
- $ref: '#/components/schemas/RegexParserScoringFnParams'
|
|
- $ref: '#/components/schemas/BasicScoringFnParams'
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
return_type:
|
|
$ref: '#/components/schemas/ParamType'
|
|
type:
|
|
const: scoring_function
|
|
default: scoring_function
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- metadata
|
|
- return_type
|
|
type: object
|
|
ScoringResult:
|
|
additionalProperties: false
|
|
properties:
|
|
aggregated_results:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
score_rows:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
required:
|
|
- score_rows
|
|
- aggregated_results
|
|
type: object
|
|
Session:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/VectorMemoryBank'
|
|
- $ref: '#/components/schemas/KeyValueMemoryBank'
|
|
- $ref: '#/components/schemas/KeywordMemoryBank'
|
|
- $ref: '#/components/schemas/GraphMemoryBank'
|
|
session_id:
|
|
type: string
|
|
session_name:
|
|
type: string
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
turns:
|
|
items:
|
|
$ref: '#/components/schemas/Turn'
|
|
type: array
|
|
required:
|
|
- session_id
|
|
- session_name
|
|
- turns
|
|
- started_at
|
|
title: A single session of an interaction with an Agentic System.
|
|
type: object
|
|
Shield:
|
|
additionalProperties: false
|
|
properties:
|
|
identifier:
|
|
type: string
|
|
params:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: shield
|
|
default: shield
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
title: A safety shield resource that can be used to check content
|
|
type: object
|
|
ShieldCallStep:
|
|
additionalProperties: false
|
|
properties:
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
const: shield_call
|
|
default: shield_call
|
|
type: string
|
|
turn_id:
|
|
type: string
|
|
violation:
|
|
$ref: '#/components/schemas/SafetyViolation'
|
|
required:
|
|
- turn_id
|
|
- step_id
|
|
- step_type
|
|
type: object
|
|
Span:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
end_time:
|
|
format: date-time
|
|
type: string
|
|
name:
|
|
type: string
|
|
parent_span_id:
|
|
type: string
|
|
span_id:
|
|
type: string
|
|
start_time:
|
|
format: date-time
|
|
type: string
|
|
trace_id:
|
|
type: string
|
|
required:
|
|
- span_id
|
|
- trace_id
|
|
- name
|
|
- start_time
|
|
type: object
|
|
SpanEndPayload:
|
|
additionalProperties: false
|
|
properties:
|
|
status:
|
|
$ref: '#/components/schemas/SpanStatus'
|
|
type:
|
|
const: span_end
|
|
default: span_end
|
|
type: string
|
|
required:
|
|
- type
|
|
- status
|
|
type: object
|
|
SpanStartPayload:
|
|
additionalProperties: false
|
|
properties:
|
|
name:
|
|
type: string
|
|
parent_span_id:
|
|
type: string
|
|
type:
|
|
const: span_start
|
|
default: span_start
|
|
type: string
|
|
required:
|
|
- type
|
|
- name
|
|
type: object
|
|
SpanStatus:
|
|
enum:
|
|
- ok
|
|
- error
|
|
type: string
|
|
SpanWithStatus:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
end_time:
|
|
format: date-time
|
|
type: string
|
|
name:
|
|
type: string
|
|
parent_span_id:
|
|
type: string
|
|
span_id:
|
|
type: string
|
|
start_time:
|
|
format: date-time
|
|
type: string
|
|
status:
|
|
$ref: '#/components/schemas/SpanStatus'
|
|
trace_id:
|
|
type: string
|
|
required:
|
|
- span_id
|
|
- trace_id
|
|
- name
|
|
- start_time
|
|
type: object
|
|
StopReason:
|
|
enum:
|
|
- end_of_turn
|
|
- end_of_message
|
|
- out_of_tokens
|
|
type: string
|
|
StructuredLogEvent:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
payload:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/SpanStartPayload'
|
|
- $ref: '#/components/schemas/SpanEndPayload'
|
|
span_id:
|
|
type: string
|
|
timestamp:
|
|
format: date-time
|
|
type: string
|
|
trace_id:
|
|
type: string
|
|
type:
|
|
const: structured_log
|
|
default: structured_log
|
|
type: string
|
|
required:
|
|
- trace_id
|
|
- span_id
|
|
- timestamp
|
|
- type
|
|
- payload
|
|
type: object
|
|
SupervisedFineTuneRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
algorithm_config:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/LoraFinetuningConfig'
|
|
- $ref: '#/components/schemas/QATFinetuningConfig'
|
|
checkpoint_dir:
|
|
type: string
|
|
hyperparam_search_config:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
job_uuid:
|
|
type: string
|
|
logger_config:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
model:
|
|
type: string
|
|
training_config:
|
|
$ref: '#/components/schemas/TrainingConfig'
|
|
required:
|
|
- job_uuid
|
|
- training_config
|
|
- hyperparam_search_config
|
|
- logger_config
|
|
- model
|
|
type: object
|
|
SyntheticDataGenerateRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dialogs:
|
|
items:
|
|
$ref: '#/components/schemas/Message'
|
|
type: array
|
|
filtering_function:
|
|
enum:
|
|
- none
|
|
- random
|
|
- top_k
|
|
- top_p
|
|
- top_k_top_p
|
|
- sigmoid
|
|
title: The type of filtering function.
|
|
type: string
|
|
model:
|
|
type: string
|
|
required:
|
|
- dialogs
|
|
- filtering_function
|
|
type: object
|
|
SyntheticDataGenerationResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
statistics:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
synthetic_data:
|
|
items:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
type: array
|
|
required:
|
|
- synthetic_data
|
|
title: Response from the synthetic data generation. Batch of (prompt, response,
|
|
score) tuples that pass the threshold.
|
|
type: object
|
|
SystemMessage:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
role:
|
|
const: system
|
|
default: system
|
|
type: string
|
|
required:
|
|
- role
|
|
- content
|
|
type: object
|
|
TextContentItem:
|
|
additionalProperties: false
|
|
properties:
|
|
text:
|
|
type: string
|
|
type:
|
|
const: text
|
|
default: text
|
|
type: string
|
|
required:
|
|
- type
|
|
- text
|
|
type: object
|
|
TokenLogProbs:
|
|
additionalProperties: false
|
|
properties:
|
|
logprobs_by_token:
|
|
additionalProperties:
|
|
type: number
|
|
type: object
|
|
required:
|
|
- logprobs_by_token
|
|
type: object
|
|
Tool:
|
|
additionalProperties: false
|
|
properties:
|
|
description:
|
|
type: string
|
|
identifier:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
parameters:
|
|
items:
|
|
$ref: '#/components/schemas/ToolParameter'
|
|
type: array
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
tool_host:
|
|
$ref: '#/components/schemas/ToolHost'
|
|
toolgroup_id:
|
|
type: string
|
|
type:
|
|
const: tool
|
|
default: tool
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- toolgroup_id
|
|
- tool_host
|
|
- description
|
|
- parameters
|
|
type: object
|
|
ToolCall:
|
|
additionalProperties: false
|
|
properties:
|
|
arguments:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: string
|
|
- type: integer
|
|
- type: number
|
|
- type: boolean
|
|
- type: 'null'
|
|
- items:
|
|
oneOf:
|
|
- type: string
|
|
- type: integer
|
|
- type: number
|
|
- type: boolean
|
|
- type: 'null'
|
|
type: array
|
|
- additionalProperties:
|
|
oneOf:
|
|
- type: string
|
|
- type: integer
|
|
- type: number
|
|
- type: boolean
|
|
- type: 'null'
|
|
type: object
|
|
type: object
|
|
call_id:
|
|
type: string
|
|
tool_name:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BuiltinTool'
|
|
- type: string
|
|
required:
|
|
- call_id
|
|
- tool_name
|
|
- arguments
|
|
type: object
|
|
ToolCallDelta:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
oneOf:
|
|
- type: string
|
|
- $ref: '#/components/schemas/ToolCall'
|
|
parse_status:
|
|
$ref: '#/components/schemas/ToolCallParseStatus'
|
|
type:
|
|
const: tool_call
|
|
default: tool_call
|
|
type: string
|
|
required:
|
|
- type
|
|
- content
|
|
- parse_status
|
|
type: object
|
|
ToolCallParseStatus:
|
|
enum:
|
|
- started
|
|
- in_progress
|
|
- failed
|
|
- succeeded
|
|
type: string
|
|
ToolChoice:
|
|
enum:
|
|
- auto
|
|
- required
|
|
type: string
|
|
ToolDef:
|
|
additionalProperties: false
|
|
properties:
|
|
description:
|
|
type: string
|
|
metadata:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
name:
|
|
type: string
|
|
parameters:
|
|
items:
|
|
$ref: '#/components/schemas/ToolParameter'
|
|
type: array
|
|
required:
|
|
- name
|
|
type: object
|
|
ToolDefinition:
|
|
additionalProperties: false
|
|
properties:
|
|
description:
|
|
type: string
|
|
parameters:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ToolParamDefinition'
|
|
type: object
|
|
tool_name:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BuiltinTool'
|
|
- type: string
|
|
required:
|
|
- tool_name
|
|
type: object
|
|
ToolExecutionStep:
|
|
additionalProperties: false
|
|
properties:
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
step_id:
|
|
type: string
|
|
step_type:
|
|
const: tool_execution
|
|
default: tool_execution
|
|
type: string
|
|
tool_calls:
|
|
items:
|
|
$ref: '#/components/schemas/ToolCall'
|
|
type: array
|
|
tool_responses:
|
|
items:
|
|
$ref: '#/components/schemas/ToolResponse'
|
|
type: array
|
|
turn_id:
|
|
type: string
|
|
required:
|
|
- turn_id
|
|
- step_id
|
|
- step_type
|
|
- tool_calls
|
|
- tool_responses
|
|
type: object
|
|
ToolGroup:
|
|
additionalProperties: false
|
|
properties:
|
|
args:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
identifier:
|
|
type: string
|
|
mcp_endpoint:
|
|
$ref: '#/components/schemas/URL'
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: tool_group
|
|
default: tool_group
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
type: object
|
|
ToolHost:
|
|
enum:
|
|
- distribution
|
|
- client
|
|
- model_context_protocol
|
|
type: string
|
|
ToolInvocationResult:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
error_code:
|
|
type: integer
|
|
error_message:
|
|
type: string
|
|
required:
|
|
- content
|
|
type: object
|
|
ToolParamDefinition:
|
|
additionalProperties: false
|
|
properties:
|
|
default:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
description:
|
|
type: string
|
|
param_type:
|
|
type: string
|
|
required:
|
|
default: true
|
|
type: boolean
|
|
required:
|
|
- param_type
|
|
type: object
|
|
ToolParameter:
|
|
additionalProperties: false
|
|
properties:
|
|
default:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
description:
|
|
type: string
|
|
name:
|
|
type: string
|
|
parameter_type:
|
|
type: string
|
|
required:
|
|
default: true
|
|
type: boolean
|
|
required:
|
|
- name
|
|
- parameter_type
|
|
- description
|
|
- required
|
|
type: object
|
|
ToolPromptFormat:
|
|
description: "`json` --\n Refers to the json format for calling tools.\n\
|
|
\ The json format takes the form like\n {\n \"type\": \"function\"\
|
|
,\n \"function\" : {\n \"name\": \"function_name\",\n \
|
|
\ \"description\": \"function_description\",\n \"parameters\"\
|
|
: {...}\n }\n }\n\n`function_tag` --\n This is an example of\
|
|
\ how you could define\n your own user defined format for making tool calls.\n\
|
|
\ The function_tag format looks like this,\n <function=function_name>(parameters)</function>\n\
|
|
\nThe detailed prompts for each of these formats are added to llama cli"
|
|
enum:
|
|
- json
|
|
- function_tag
|
|
- python_list
|
|
title: This Enum refers to the prompt format for calling custom / zero shot
|
|
tools
|
|
type: string
|
|
ToolResponse:
|
|
additionalProperties: false
|
|
properties:
|
|
call_id:
|
|
type: string
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
tool_name:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BuiltinTool'
|
|
- type: string
|
|
required:
|
|
- call_id
|
|
- tool_name
|
|
- content
|
|
type: object
|
|
ToolResponseMessage:
|
|
additionalProperties: false
|
|
properties:
|
|
call_id:
|
|
type: string
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
role:
|
|
const: tool
|
|
default: tool
|
|
type: string
|
|
tool_name:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/BuiltinTool'
|
|
- type: string
|
|
required:
|
|
- role
|
|
- call_id
|
|
- tool_name
|
|
- content
|
|
type: object
|
|
TopKSamplingStrategy:
|
|
additionalProperties: false
|
|
properties:
|
|
top_k:
|
|
type: integer
|
|
type:
|
|
const: top_k
|
|
default: top_k
|
|
type: string
|
|
required:
|
|
- type
|
|
- top_k
|
|
type: object
|
|
TopPSamplingStrategy:
|
|
additionalProperties: false
|
|
properties:
|
|
temperature:
|
|
type: number
|
|
top_p:
|
|
default: 0.95
|
|
type: number
|
|
type:
|
|
const: top_p
|
|
default: top_p
|
|
type: string
|
|
required:
|
|
- type
|
|
type: object
|
|
Trace:
|
|
additionalProperties: false
|
|
properties:
|
|
end_time:
|
|
format: date-time
|
|
type: string
|
|
root_span_id:
|
|
type: string
|
|
start_time:
|
|
format: date-time
|
|
type: string
|
|
trace_id:
|
|
type: string
|
|
required:
|
|
- trace_id
|
|
- root_span_id
|
|
- start_time
|
|
type: object
|
|
TrainingConfig:
|
|
additionalProperties: false
|
|
properties:
|
|
data_config:
|
|
$ref: '#/components/schemas/DataConfig'
|
|
dtype:
|
|
default: bf16
|
|
type: string
|
|
efficiency_config:
|
|
$ref: '#/components/schemas/EfficiencyConfig'
|
|
gradient_accumulation_steps:
|
|
type: integer
|
|
max_steps_per_epoch:
|
|
type: integer
|
|
max_validation_steps:
|
|
type: integer
|
|
n_epochs:
|
|
type: integer
|
|
optimizer_config:
|
|
$ref: '#/components/schemas/OptimizerConfig'
|
|
required:
|
|
- n_epochs
|
|
- max_steps_per_epoch
|
|
- gradient_accumulation_steps
|
|
- max_validation_steps
|
|
- data_config
|
|
- optimizer_config
|
|
type: object
|
|
Turn:
|
|
additionalProperties: false
|
|
properties:
|
|
completed_at:
|
|
format: date-time
|
|
type: string
|
|
input_messages:
|
|
items:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/UserMessage'
|
|
- $ref: '#/components/schemas/ToolResponseMessage'
|
|
type: array
|
|
output_attachments:
|
|
items:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
oneOf:
|
|
- type: string
|
|
- $ref: '#/components/schemas/InterleavedContentItem'
|
|
- items:
|
|
$ref: '#/components/schemas/InterleavedContentItem'
|
|
type: array
|
|
- $ref: '#/components/schemas/URL'
|
|
mime_type:
|
|
type: string
|
|
required:
|
|
- content
|
|
- mime_type
|
|
type: object
|
|
type: array
|
|
output_message:
|
|
$ref: '#/components/schemas/CompletionMessage'
|
|
session_id:
|
|
type: string
|
|
started_at:
|
|
format: date-time
|
|
type: string
|
|
steps:
|
|
items:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/InferenceStep'
|
|
- $ref: '#/components/schemas/ToolExecutionStep'
|
|
- $ref: '#/components/schemas/ShieldCallStep'
|
|
- $ref: '#/components/schemas/MemoryRetrievalStep'
|
|
type: array
|
|
turn_id:
|
|
type: string
|
|
required:
|
|
- turn_id
|
|
- session_id
|
|
- input_messages
|
|
- steps
|
|
- output_message
|
|
- output_attachments
|
|
- started_at
|
|
title: A single turn in an interaction with an Agentic System.
|
|
type: object
|
|
URL:
|
|
additionalProperties: false
|
|
properties:
|
|
uri:
|
|
type: string
|
|
required:
|
|
- uri
|
|
type: object
|
|
UnregisterDatasetRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
dataset_id:
|
|
type: string
|
|
required:
|
|
- dataset_id
|
|
type: object
|
|
UnregisterMemoryBankRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
memory_bank_id:
|
|
type: string
|
|
required:
|
|
- memory_bank_id
|
|
type: object
|
|
UnregisterModelRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
model_id:
|
|
type: string
|
|
required:
|
|
- model_id
|
|
type: object
|
|
UnregisterToolGroupRequest:
|
|
additionalProperties: false
|
|
properties:
|
|
tool_group_id:
|
|
type: string
|
|
required:
|
|
- tool_group_id
|
|
type: object
|
|
UnstructuredLogEvent:
|
|
additionalProperties: false
|
|
properties:
|
|
attributes:
|
|
additionalProperties:
|
|
oneOf:
|
|
- type: 'null'
|
|
- type: boolean
|
|
- type: number
|
|
- type: string
|
|
- type: array
|
|
- type: object
|
|
type: object
|
|
message:
|
|
type: string
|
|
severity:
|
|
$ref: '#/components/schemas/LogSeverity'
|
|
span_id:
|
|
type: string
|
|
timestamp:
|
|
format: date-time
|
|
type: string
|
|
trace_id:
|
|
type: string
|
|
type:
|
|
const: unstructured_log
|
|
default: unstructured_log
|
|
type: string
|
|
required:
|
|
- trace_id
|
|
- span_id
|
|
- timestamp
|
|
- type
|
|
- message
|
|
- severity
|
|
type: object
|
|
UserMessage:
|
|
additionalProperties: false
|
|
properties:
|
|
content:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
context:
|
|
$ref: '#/components/schemas/InterleavedContent'
|
|
role:
|
|
const: user
|
|
default: user
|
|
type: string
|
|
required:
|
|
- role
|
|
- content
|
|
type: object
|
|
VectorMemoryBank:
|
|
additionalProperties: false
|
|
properties:
|
|
chunk_size_in_tokens:
|
|
type: integer
|
|
embedding_dimension:
|
|
default: 384
|
|
type: integer
|
|
embedding_model:
|
|
type: string
|
|
identifier:
|
|
type: string
|
|
memory_bank_type:
|
|
const: vector
|
|
default: vector
|
|
type: string
|
|
overlap_size_in_tokens:
|
|
type: integer
|
|
provider_id:
|
|
type: string
|
|
provider_resource_id:
|
|
type: string
|
|
type:
|
|
const: memory_bank
|
|
default: memory_bank
|
|
type: string
|
|
required:
|
|
- identifier
|
|
- provider_resource_id
|
|
- provider_id
|
|
- type
|
|
- memory_bank_type
|
|
- embedding_model
|
|
- chunk_size_in_tokens
|
|
type: object
|
|
VectorMemoryBankParams:
|
|
additionalProperties: false
|
|
properties:
|
|
chunk_size_in_tokens:
|
|
type: integer
|
|
embedding_model:
|
|
type: string
|
|
memory_bank_type:
|
|
const: vector
|
|
default: vector
|
|
type: string
|
|
overlap_size_in_tokens:
|
|
type: integer
|
|
required:
|
|
- memory_bank_type
|
|
- embedding_model
|
|
- chunk_size_in_tokens
|
|
type: object
|
|
VersionInfo:
|
|
additionalProperties: false
|
|
properties:
|
|
version:
|
|
type: string
|
|
required:
|
|
- version
|
|
type: object
|
|
ViolationLevel:
|
|
enum:
|
|
- info
|
|
- warn
|
|
- error
|
|
type: string
|
|
info:
|
|
description: "This is the specification of the Llama Stack that provides\n \
|
|
\ a set of endpoints and their corresponding interfaces that are tailored\
|
|
\ to\n best leverage Llama Models."
|
|
title: Llama Stack Specification
|
|
version: alpha
|
|
jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema
|
|
openapi: 3.1.0
|
|
paths:
|
|
/alpha/agents/create:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/CreateAgentRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/AgentCreateResponse'
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/delete:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/DeleteAgentsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/session/create:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/CreateAgentSessionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/AgentSessionCreateResponse'
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/session/delete:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/DeleteAgentsSessionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/session/get:
|
|
post:
|
|
parameters:
|
|
- in: query
|
|
name: agent_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: session_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/GetAgentsSessionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Session'
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/step/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: agent_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: session_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: turn_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: step_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/AgentStepResponse'
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/turn/create:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/CreateAgentTurnRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
text/event-stream:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/Turn'
|
|
- $ref: '#/components/schemas/AgentTurnResponseStreamChunk'
|
|
description: A single turn in an interaction with an Agentic System. **OR**
|
|
streamed agent turn completion response.
|
|
tags:
|
|
- Agents
|
|
/alpha/agents/turn/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: agent_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: session_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: turn_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Turn'
|
|
description: OK
|
|
tags:
|
|
- Agents
|
|
/alpha/batch-inference/chat-completion:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/BatchChatCompletionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/BatchChatCompletionResponse'
|
|
description: OK
|
|
tags:
|
|
- BatchInference (Coming Soon)
|
|
/alpha/batch-inference/completion:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/BatchCompletionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/BatchCompletionResponse'
|
|
description: OK
|
|
tags:
|
|
- BatchInference (Coming Soon)
|
|
/alpha/datasetio/append-rows:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/AppendRowsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- DatasetIO
|
|
/alpha/datasetio/get-rows-paginated:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: dataset_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: rows_in_page
|
|
required: true
|
|
schema:
|
|
type: integer
|
|
- in: query
|
|
name: page_token
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: filter_condition
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/PaginatedRowsResult'
|
|
description: OK
|
|
tags:
|
|
- DatasetIO
|
|
/alpha/datasets/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: dataset_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/Dataset'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- Datasets
|
|
/alpha/datasets/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Dataset'
|
|
description: OK
|
|
tags:
|
|
- Datasets
|
|
/alpha/datasets/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterDatasetRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Datasets
|
|
/alpha/datasets/unregister:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/UnregisterDatasetRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Datasets
|
|
/alpha/eval-tasks/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: name
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/EvalTask'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- EvalTasks
|
|
/alpha/eval-tasks/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/EvalTask'
|
|
description: OK
|
|
tags:
|
|
- EvalTasks
|
|
/alpha/eval-tasks/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterEvalTaskRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- EvalTasks
|
|
/alpha/eval/evaluate-rows:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/EvaluateRowsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/EvaluateResponse'
|
|
description: OK
|
|
tags:
|
|
- Eval
|
|
/alpha/eval/job/cancel:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/JobCancelRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Eval
|
|
/alpha/eval/job/result:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: task_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: job_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/EvaluateResponse'
|
|
description: OK
|
|
tags:
|
|
- Eval
|
|
/alpha/eval/job/status:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: task_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: job_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/JobStatus'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- Eval
|
|
/alpha/eval/run-eval:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RunEvalRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Job'
|
|
description: OK
|
|
tags:
|
|
- Eval
|
|
/alpha/health:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/HealthInfo'
|
|
description: OK
|
|
tags:
|
|
- Inspect
|
|
/alpha/inference/chat-completion:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ChatCompletionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
text/event-stream:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/ChatCompletionResponse'
|
|
- $ref: '#/components/schemas/ChatCompletionResponseStreamChunk'
|
|
description: Chat completion response. **OR** SSE-stream of these events.
|
|
tags:
|
|
- Inference
|
|
/alpha/inference/completion:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/CompletionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
text/event-stream:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/CompletionResponse'
|
|
- $ref: '#/components/schemas/CompletionResponseStreamChunk'
|
|
description: Completion response. **OR** streamed completion response.
|
|
tags:
|
|
- Inference
|
|
/alpha/inference/embeddings:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/EmbeddingsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/EmbeddingsResponse'
|
|
description: OK
|
|
tags:
|
|
- Inference
|
|
/alpha/memory-banks/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: memory_bank_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- oneOf:
|
|
- $ref: '#/components/schemas/VectorMemoryBank'
|
|
- $ref: '#/components/schemas/KeyValueMemoryBank'
|
|
- $ref: '#/components/schemas/KeywordMemoryBank'
|
|
- $ref: '#/components/schemas/GraphMemoryBank'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- MemoryBanks
|
|
/alpha/memory-banks/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/VectorMemoryBank'
|
|
- $ref: '#/components/schemas/KeyValueMemoryBank'
|
|
- $ref: '#/components/schemas/KeywordMemoryBank'
|
|
- $ref: '#/components/schemas/GraphMemoryBank'
|
|
description: OK
|
|
tags:
|
|
- MemoryBanks
|
|
/alpha/memory-banks/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterMemoryBankRequest'
|
|
required: true
|
|
responses: {}
|
|
tags:
|
|
- MemoryBanks
|
|
/alpha/memory-banks/unregister:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/UnregisterMemoryBankRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- MemoryBanks
|
|
/alpha/memory/insert:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/InsertDocumentsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Memory
|
|
/alpha/memory/query:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/QueryDocumentsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/QueryDocumentsResponse'
|
|
description: OK
|
|
tags:
|
|
- Memory
|
|
/alpha/models/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: identifier
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/Model'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- Models
|
|
/alpha/models/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Model'
|
|
description: OK
|
|
tags:
|
|
- Models
|
|
/alpha/models/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterModelRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Model'
|
|
description: OK
|
|
tags:
|
|
- Models
|
|
/alpha/models/unregister:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/UnregisterModelRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Models
|
|
/alpha/post-training/job/artifacts:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: job_uuid
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/PostTrainingJobArtifactsResponse'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/post-training/job/cancel:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/CancelTrainingJobRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/post-training/job/status:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: job_uuid
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/PostTrainingJobStatusResponse'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/post-training/jobs:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/PostTrainingJob'
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/post-training/preference-optimize:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/PreferenceOptimizeRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/PostTrainingJob'
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/post-training/supervised-fine-tune:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/SupervisedFineTuneRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/PostTrainingJob'
|
|
description: OK
|
|
tags:
|
|
- PostTraining (Coming Soon)
|
|
/alpha/providers/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/ProviderInfo'
|
|
type: object
|
|
description: OK
|
|
tags:
|
|
- Inspect
|
|
/alpha/routes/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
additionalProperties:
|
|
items:
|
|
$ref: '#/components/schemas/RouteInfo'
|
|
type: array
|
|
type: object
|
|
description: OK
|
|
tags:
|
|
- Inspect
|
|
/alpha/safety/run-shield:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RunShieldRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RunShieldResponse'
|
|
description: OK
|
|
tags:
|
|
- Safety
|
|
/alpha/scoring-functions/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: scoring_fn_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/ScoringFn'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- ScoringFunctions
|
|
/alpha/scoring-functions/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/ScoringFn'
|
|
description: OK
|
|
tags:
|
|
- ScoringFunctions
|
|
/alpha/scoring-functions/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterScoringFunctionRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- ScoringFunctions
|
|
/alpha/scoring/score:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ScoreRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ScoreResponse'
|
|
description: OK
|
|
tags:
|
|
- Scoring
|
|
/alpha/scoring/score-batch:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ScoreBatchRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ScoreBatchResponse'
|
|
description: OK
|
|
tags:
|
|
- Scoring
|
|
/alpha/shields/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: identifier
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
oneOf:
|
|
- $ref: '#/components/schemas/Shield'
|
|
- type: 'null'
|
|
description: OK
|
|
tags:
|
|
- Shields
|
|
/alpha/shields/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Shield'
|
|
description: OK
|
|
tags:
|
|
- Shields
|
|
/alpha/shields/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterShieldRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Shield'
|
|
description: OK
|
|
tags:
|
|
- Shields
|
|
/alpha/synthetic-data-generation/generate:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/SyntheticDataGenerateRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/SyntheticDataGenerationResponse'
|
|
description: OK
|
|
tags:
|
|
- SyntheticDataGeneration (Coming Soon)
|
|
/alpha/telemetry/get-span-tree:
|
|
post:
|
|
parameters:
|
|
- in: query
|
|
name: span_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- in: query
|
|
name: max_depth
|
|
required: false
|
|
schema:
|
|
type: integer
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/GetSpanTreeRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
additionalProperties:
|
|
$ref: '#/components/schemas/SpanWithStatus'
|
|
type: object
|
|
description: OK
|
|
tags:
|
|
- Telemetry
|
|
/alpha/telemetry/log-event:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/LogEventRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Telemetry
|
|
/alpha/telemetry/query-spans:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/QuerySpansRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Span'
|
|
description: OK
|
|
tags:
|
|
- Telemetry
|
|
/alpha/telemetry/query-traces:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/QueryTracesRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Trace'
|
|
description: OK
|
|
tags:
|
|
- Telemetry
|
|
/alpha/telemetry/save-spans-to-dataset:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/SaveSpansToDatasetRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
tags:
|
|
- Telemetry
|
|
/alpha/tool-runtime/invoke:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/InvokeToolRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ToolInvocationResult'
|
|
description: OK
|
|
summary: Run a tool with the given arguments
|
|
tags:
|
|
- ToolRuntime
|
|
/alpha/tool-runtime/list-tools:
|
|
post:
|
|
parameters:
|
|
- in: query
|
|
name: tool_group_id
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ListRuntimeToolsRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/ToolDef'
|
|
description: OK
|
|
tags:
|
|
- ToolRuntime
|
|
/alpha/toolgroups/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: toolgroup_id
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/ToolGroup'
|
|
description: OK
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/toolgroups/list:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/ToolGroup'
|
|
description: OK
|
|
summary: List tool groups with optional provider
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/toolgroups/register:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/RegisterToolGroupRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
summary: Register a tool group
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/toolgroups/unregister:
|
|
post:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
requestBody:
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/UnregisterToolGroupRequest'
|
|
required: true
|
|
responses:
|
|
'200':
|
|
description: OK
|
|
summary: Unregister a tool group
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/tools/get:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: tool_name
|
|
required: true
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/Tool'
|
|
description: OK
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/tools/list:
|
|
get:
|
|
parameters:
|
|
- in: query
|
|
name: tool_group_id
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/jsonl:
|
|
schema:
|
|
$ref: '#/components/schemas/Tool'
|
|
description: OK
|
|
summary: List tools with optional tool group
|
|
tags:
|
|
- ToolGroups
|
|
/alpha/version:
|
|
get:
|
|
parameters:
|
|
- description: JSON-encoded provider data which will be made available to the
|
|
adapter servicing the API
|
|
in: header
|
|
name: X-LlamaStack-Provider-Data
|
|
required: false
|
|
schema:
|
|
type: string
|
|
- description: Version of the client making the request. This is used to ensure
|
|
that the client and server are compatible.
|
|
in: header
|
|
name: X-LlamaStack-Client-Version
|
|
required: false
|
|
schema:
|
|
type: string
|
|
responses:
|
|
'200':
|
|
content:
|
|
application/json:
|
|
schema:
|
|
$ref: '#/components/schemas/VersionInfo'
|
|
description: OK
|
|
tags:
|
|
- Inspect
|
|
security:
|
|
- Default: []
|
|
servers:
|
|
- url: http://any-hosted-llama-stack.com
|
|
tags:
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentCandidate" />
|
|
name: AgentCandidate
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentConfig" />
|
|
name: AgentConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentCreateResponse"
|
|
/>
|
|
name: AgentCreateResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentSessionCreateResponse"
|
|
/>
|
|
name: AgentSessionCreateResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentStepResponse"
|
|
/>
|
|
name: AgentStepResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTool" />
|
|
name: AgentTool
|
|
- description: 'Streamed agent execution response.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseEvent" />'
|
|
name: AgentTurnResponseEvent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepCompletePayload"
|
|
/>
|
|
name: AgentTurnResponseStepCompletePayload
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepProgressPayload"
|
|
/>
|
|
name: AgentTurnResponseStepProgressPayload
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepStartPayload"
|
|
/>
|
|
name: AgentTurnResponseStepStartPayload
|
|
- description: 'streamed agent turn completion response.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStreamChunk"
|
|
/>'
|
|
name: AgentTurnResponseStreamChunk
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseTurnCompletePayload"
|
|
/>
|
|
name: AgentTurnResponseTurnCompletePayload
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseTurnStartPayload"
|
|
/>
|
|
name: AgentTurnResponseTurnStartPayload
|
|
- name: Agents
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AggregationFunctionType"
|
|
/>
|
|
name: AggregationFunctionType
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AppEvalTaskConfig"
|
|
/>
|
|
name: AppEvalTaskConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AppendRowsRequest"
|
|
/>
|
|
name: AppendRowsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BasicScoringFnParams"
|
|
/>
|
|
name: BasicScoringFnParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchChatCompletionRequest"
|
|
/>
|
|
name: BatchChatCompletionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchChatCompletionResponse"
|
|
/>
|
|
name: BatchChatCompletionResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchCompletionRequest"
|
|
/>
|
|
name: BatchCompletionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchCompletionResponse"
|
|
/>
|
|
name: BatchCompletionResponse
|
|
- name: BatchInference (Coming Soon)
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BenchmarkEvalTaskConfig"
|
|
/>
|
|
name: BenchmarkEvalTaskConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/BuiltinTool" />
|
|
name: BuiltinTool
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CancelTrainingJobRequest"
|
|
/>
|
|
name: CancelTrainingJobRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest"
|
|
/>
|
|
name: ChatCompletionRequest
|
|
- description: 'Chat completion response.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />'
|
|
name: ChatCompletionResponse
|
|
- description: 'Chat completion response event.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseEvent"
|
|
/>'
|
|
name: ChatCompletionResponseEvent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseEventType"
|
|
/>
|
|
name: ChatCompletionResponseEventType
|
|
- description: 'SSE-stream of these events.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseStreamChunk"
|
|
/>'
|
|
name: ChatCompletionResponseStreamChunk
|
|
- description: 'Checkpoint created during training runs
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/Checkpoint" />'
|
|
name: Checkpoint
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CompletionMessage"
|
|
/>
|
|
name: CompletionMessage
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CompletionRequest"
|
|
/>
|
|
name: CompletionRequest
|
|
- description: 'Completion response.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/CompletionResponse" />'
|
|
name: CompletionResponse
|
|
- description: 'streamed completion response.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/CompletionResponseStreamChunk"
|
|
/>'
|
|
name: CompletionResponseStreamChunk
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ContentDelta" />
|
|
name: ContentDelta
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentRequest"
|
|
/>
|
|
name: CreateAgentRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentSessionRequest"
|
|
/>
|
|
name: CreateAgentSessionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentTurnRequest"
|
|
/>
|
|
name: CreateAgentTurnRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/DPOAlignmentConfig"
|
|
/>
|
|
name: DPOAlignmentConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/DataConfig" />
|
|
name: DataConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Dataset" />
|
|
name: Dataset
|
|
- name: DatasetIO
|
|
- name: Datasets
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsRequest"
|
|
/>
|
|
name: DeleteAgentsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsSessionRequest"
|
|
/>
|
|
name: DeleteAgentsSessionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EfficiencyConfig"
|
|
/>
|
|
name: EfficiencyConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EmbeddingsRequest"
|
|
/>
|
|
name: EmbeddingsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EmbeddingsResponse"
|
|
/>
|
|
name: EmbeddingsResponse
|
|
- name: Eval
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EvalTask" />
|
|
name: EvalTask
|
|
- name: EvalTasks
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateResponse"
|
|
/>
|
|
name: EvaluateResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateRowsRequest"
|
|
/>
|
|
name: EvaluateRowsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/GetAgentsSessionRequest"
|
|
/>
|
|
name: GetAgentsSessionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/GetSpanTreeRequest"
|
|
/>
|
|
name: GetSpanTreeRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/GraphMemoryBank"
|
|
/>
|
|
name: GraphMemoryBank
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/GraphMemoryBankParams"
|
|
/>
|
|
name: GraphMemoryBankParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/GreedySamplingStrategy"
|
|
/>
|
|
name: GreedySamplingStrategy
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/HealthInfo" />
|
|
name: HealthInfo
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ImageContentItem"
|
|
/>
|
|
name: ImageContentItem
|
|
- name: Inference
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/InferenceStep" />
|
|
name: InferenceStep
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/InsertDocumentsRequest"
|
|
/>
|
|
name: InsertDocumentsRequest
|
|
- name: Inspect
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/InterleavedContent"
|
|
/>
|
|
name: InterleavedContent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/InterleavedContentItem"
|
|
/>
|
|
name: InterleavedContentItem
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/InvokeToolRequest"
|
|
/>
|
|
name: InvokeToolRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Job" />
|
|
name: Job
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/JobCancelRequest"
|
|
/>
|
|
name: JobCancelRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/JobStatus" />
|
|
name: JobStatus
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/KeyValueMemoryBank"
|
|
/>
|
|
name: KeyValueMemoryBank
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/KeyValueMemoryBankParams"
|
|
/>
|
|
name: KeyValueMemoryBankParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/KeywordMemoryBank"
|
|
/>
|
|
name: KeywordMemoryBank
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/KeywordMemoryBankParams"
|
|
/>
|
|
name: KeywordMemoryBankParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/LLMAsJudgeScoringFnParams"
|
|
/>
|
|
name: LLMAsJudgeScoringFnParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ListRuntimeToolsRequest"
|
|
/>
|
|
name: ListRuntimeToolsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/LogEventRequest"
|
|
/>
|
|
name: LogEventRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/LogSeverity" />
|
|
name: LogSeverity
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/LoraFinetuningConfig"
|
|
/>
|
|
name: LoraFinetuningConfig
|
|
- name: Memory
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryBankDocument"
|
|
/>
|
|
name: MemoryBankDocument
|
|
- name: MemoryBanks
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryRetrievalStep"
|
|
/>
|
|
name: MemoryRetrievalStep
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Message" />
|
|
name: Message
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/MetricEvent" />
|
|
name: MetricEvent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Model" />
|
|
name: Model
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ModelCandidate" />
|
|
name: ModelCandidate
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ModelType" />
|
|
name: ModelType
|
|
- name: Models
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/OptimizerConfig"
|
|
/>
|
|
name: OptimizerConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/OptimizerType" />
|
|
name: OptimizerType
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/PaginatedRowsResult"
|
|
/>
|
|
name: PaginatedRowsResult
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ParamType" />
|
|
name: ParamType
|
|
- name: PostTraining (Coming Soon)
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJob"
|
|
/>
|
|
name: PostTrainingJob
|
|
- description: 'Artifacts of a finetuning job.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobArtifactsResponse"
|
|
/>'
|
|
name: PostTrainingJobArtifactsResponse
|
|
- description: 'Status of a finetuning job.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobStatusResponse"
|
|
/>'
|
|
name: PostTrainingJobStatusResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/PreferenceOptimizeRequest"
|
|
/>
|
|
name: PreferenceOptimizeRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ProviderInfo" />
|
|
name: ProviderInfo
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QATFinetuningConfig"
|
|
/>
|
|
name: QATFinetuningConfig
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryCondition" />
|
|
name: QueryCondition
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryConditionOp"
|
|
/>
|
|
name: QueryConditionOp
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryDocumentsRequest"
|
|
/>
|
|
name: QueryDocumentsRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryDocumentsResponse"
|
|
/>
|
|
name: QueryDocumentsResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QuerySpansRequest"
|
|
/>
|
|
name: QuerySpansRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryTracesRequest"
|
|
/>
|
|
name: QueryTracesRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegexParserScoringFnParams"
|
|
/>
|
|
name: RegexParserScoringFnParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterDatasetRequest"
|
|
/>
|
|
name: RegisterDatasetRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterEvalTaskRequest"
|
|
/>
|
|
name: RegisterEvalTaskRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterMemoryBankRequest"
|
|
/>
|
|
name: RegisterMemoryBankRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterModelRequest"
|
|
/>
|
|
name: RegisterModelRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterScoringFunctionRequest"
|
|
/>
|
|
name: RegisterScoringFunctionRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterShieldRequest"
|
|
/>
|
|
name: RegisterShieldRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RegisterToolGroupRequest"
|
|
/>
|
|
name: RegisterToolGroupRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ResponseFormat" />
|
|
name: ResponseFormat
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RouteInfo" />
|
|
name: RouteInfo
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RunEvalRequest" />
|
|
name: RunEvalRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RunShieldRequest"
|
|
/>
|
|
name: RunShieldRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/RunShieldResponse"
|
|
/>
|
|
name: RunShieldResponse
|
|
- name: Safety
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SafetyViolation"
|
|
/>
|
|
name: SafetyViolation
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SamplingParams" />
|
|
name: SamplingParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SaveSpansToDatasetRequest"
|
|
/>
|
|
name: SaveSpansToDatasetRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoreBatchRequest"
|
|
/>
|
|
name: ScoreBatchRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoreBatchResponse"
|
|
/>
|
|
name: ScoreBatchResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoreRequest" />
|
|
name: ScoreRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoreResponse" />
|
|
name: ScoreResponse
|
|
- name: Scoring
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoringFn" />
|
|
name: ScoringFn
|
|
- name: ScoringFunctions
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoringResult" />
|
|
name: ScoringResult
|
|
- description: 'A single session of an interaction with an Agentic System.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/Session" />'
|
|
name: Session
|
|
- description: 'A safety shield resource that can be used to check content.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/Shield" />'
|
|
name: Shield
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ShieldCallStep" />
|
|
name: ShieldCallStep
|
|
- name: Shields
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Span" />
|
|
name: Span
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanEndPayload" />
|
|
name: SpanEndPayload
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanStartPayload"
|
|
/>
|
|
name: SpanStartPayload
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanStatus" />
|
|
name: SpanStatus
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanWithStatus" />
|
|
name: SpanWithStatus
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/StopReason" />
|
|
name: StopReason
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/StructuredLogEvent"
|
|
/>
|
|
name: StructuredLogEvent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SupervisedFineTuneRequest"
|
|
/>
|
|
name: SupervisedFineTuneRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SyntheticDataGenerateRequest"
|
|
/>
|
|
name: SyntheticDataGenerateRequest
|
|
- name: SyntheticDataGeneration (Coming Soon)
|
|
- description: 'Response from the synthetic data generation. Batch of (prompt, response,
|
|
score) tuples that pass the threshold.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/SyntheticDataGenerationResponse"
|
|
/>'
|
|
name: SyntheticDataGenerationResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/SystemMessage" />
|
|
name: SystemMessage
|
|
- name: Telemetry
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/TextContentItem"
|
|
/>
|
|
name: TextContentItem
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/TokenLogProbs" />
|
|
name: TokenLogProbs
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Tool" />
|
|
name: Tool
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCall" />
|
|
name: ToolCall
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCallDelta" />
|
|
name: ToolCallDelta
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCallParseStatus"
|
|
/>
|
|
name: ToolCallParseStatus
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolChoice" />
|
|
name: ToolChoice
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolDef" />
|
|
name: ToolDef
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolDefinition" />
|
|
name: ToolDefinition
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolExecutionStep"
|
|
/>
|
|
name: ToolExecutionStep
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolGroup" />
|
|
name: ToolGroup
|
|
- name: ToolGroups
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolHost" />
|
|
name: ToolHost
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolInvocationResult"
|
|
/>
|
|
name: ToolInvocationResult
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolParamDefinition"
|
|
/>
|
|
name: ToolParamDefinition
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolParameter" />
|
|
name: ToolParameter
|
|
- description: "This Enum refers to the prompt format for calling custom / zero shot\
|
|
\ tools\n\n`json` --\n Refers to the json format for calling tools.\n The\
|
|
\ json format takes the form like\n {\n \"type\": \"function\",\n \
|
|
\ \"function\" : {\n \"name\": \"function_name\",\n \
|
|
\ \"description\": \"function_description\",\n \"parameters\": {...}\n\
|
|
\ }\n }\n\n`function_tag` --\n This is an example of how you could\
|
|
\ define\n your own user defined format for making tool calls.\n The function_tag\
|
|
\ format looks like this,\n <function=function_name>(parameters)</function>\n\
|
|
\nThe detailed prompts for each of these formats are added to llama cli\n\n<SchemaDefinition\
|
|
\ schemaRef=\"#/components/schemas/ToolPromptFormat\" />"
|
|
name: ToolPromptFormat
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolResponse" />
|
|
name: ToolResponse
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolResponseMessage"
|
|
/>
|
|
name: ToolResponseMessage
|
|
- name: ToolRuntime
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/TopKSamplingStrategy"
|
|
/>
|
|
name: TopKSamplingStrategy
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/TopPSamplingStrategy"
|
|
/>
|
|
name: TopPSamplingStrategy
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Trace" />
|
|
name: Trace
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/TrainingConfig" />
|
|
name: TrainingConfig
|
|
- description: 'A single turn in an interaction with an Agentic System.
|
|
|
|
|
|
<SchemaDefinition schemaRef="#/components/schemas/Turn" />'
|
|
name: Turn
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/URL" />
|
|
name: URL
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterDatasetRequest"
|
|
/>
|
|
name: UnregisterDatasetRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterMemoryBankRequest"
|
|
/>
|
|
name: UnregisterMemoryBankRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterModelRequest"
|
|
/>
|
|
name: UnregisterModelRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UnregisterToolGroupRequest"
|
|
/>
|
|
name: UnregisterToolGroupRequest
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UnstructuredLogEvent"
|
|
/>
|
|
name: UnstructuredLogEvent
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/UserMessage" />
|
|
name: UserMessage
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/VectorMemoryBank"
|
|
/>
|
|
name: VectorMemoryBank
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/VectorMemoryBankParams"
|
|
/>
|
|
name: VectorMemoryBankParams
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/VersionInfo" />
|
|
name: VersionInfo
|
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ViolationLevel" />
|
|
name: ViolationLevel
|
|
x-tagGroups:
|
|
- name: Operations
|
|
tags:
|
|
- Agents
|
|
- BatchInference (Coming Soon)
|
|
- DatasetIO
|
|
- Datasets
|
|
- Eval
|
|
- EvalTasks
|
|
- Inference
|
|
- Inspect
|
|
- Memory
|
|
- MemoryBanks
|
|
- Models
|
|
- PostTraining (Coming Soon)
|
|
- Safety
|
|
- Scoring
|
|
- ScoringFunctions
|
|
- Shields
|
|
- SyntheticDataGeneration (Coming Soon)
|
|
- Telemetry
|
|
- ToolGroups
|
|
- ToolRuntime
|
|
- name: Types
|
|
tags:
|
|
- AgentCandidate
|
|
- AgentConfig
|
|
- AgentCreateResponse
|
|
- AgentSessionCreateResponse
|
|
- AgentStepResponse
|
|
- AgentTool
|
|
- AgentTurnResponseEvent
|
|
- AgentTurnResponseStepCompletePayload
|
|
- AgentTurnResponseStepProgressPayload
|
|
- AgentTurnResponseStepStartPayload
|
|
- AgentTurnResponseStreamChunk
|
|
- AgentTurnResponseTurnCompletePayload
|
|
- AgentTurnResponseTurnStartPayload
|
|
- AggregationFunctionType
|
|
- AppEvalTaskConfig
|
|
- AppendRowsRequest
|
|
- BasicScoringFnParams
|
|
- BatchChatCompletionRequest
|
|
- BatchChatCompletionResponse
|
|
- BatchCompletionRequest
|
|
- BatchCompletionResponse
|
|
- BenchmarkEvalTaskConfig
|
|
- BuiltinTool
|
|
- CancelTrainingJobRequest
|
|
- ChatCompletionRequest
|
|
- ChatCompletionResponse
|
|
- ChatCompletionResponseEvent
|
|
- ChatCompletionResponseEventType
|
|
- ChatCompletionResponseStreamChunk
|
|
- Checkpoint
|
|
- CompletionMessage
|
|
- CompletionRequest
|
|
- CompletionResponse
|
|
- CompletionResponseStreamChunk
|
|
- ContentDelta
|
|
- CreateAgentRequest
|
|
- CreateAgentSessionRequest
|
|
- CreateAgentTurnRequest
|
|
- DPOAlignmentConfig
|
|
- DataConfig
|
|
- Dataset
|
|
- DeleteAgentsRequest
|
|
- DeleteAgentsSessionRequest
|
|
- EfficiencyConfig
|
|
- EmbeddingsRequest
|
|
- EmbeddingsResponse
|
|
- EvalTask
|
|
- EvaluateResponse
|
|
- EvaluateRowsRequest
|
|
- GetAgentsSessionRequest
|
|
- GetSpanTreeRequest
|
|
- GraphMemoryBank
|
|
- GraphMemoryBankParams
|
|
- GreedySamplingStrategy
|
|
- HealthInfo
|
|
- ImageContentItem
|
|
- InferenceStep
|
|
- InsertDocumentsRequest
|
|
- InterleavedContent
|
|
- InterleavedContentItem
|
|
- InvokeToolRequest
|
|
- Job
|
|
- JobCancelRequest
|
|
- JobStatus
|
|
- KeyValueMemoryBank
|
|
- KeyValueMemoryBankParams
|
|
- KeywordMemoryBank
|
|
- KeywordMemoryBankParams
|
|
- LLMAsJudgeScoringFnParams
|
|
- ListRuntimeToolsRequest
|
|
- LogEventRequest
|
|
- LogSeverity
|
|
- LoraFinetuningConfig
|
|
- MemoryBankDocument
|
|
- MemoryRetrievalStep
|
|
- Message
|
|
- MetricEvent
|
|
- Model
|
|
- ModelCandidate
|
|
- ModelType
|
|
- OptimizerConfig
|
|
- OptimizerType
|
|
- PaginatedRowsResult
|
|
- ParamType
|
|
- PostTrainingJob
|
|
- PostTrainingJobArtifactsResponse
|
|
- PostTrainingJobStatusResponse
|
|
- PreferenceOptimizeRequest
|
|
- ProviderInfo
|
|
- QATFinetuningConfig
|
|
- QueryCondition
|
|
- QueryConditionOp
|
|
- QueryDocumentsRequest
|
|
- QueryDocumentsResponse
|
|
- QuerySpansRequest
|
|
- QueryTracesRequest
|
|
- RegexParserScoringFnParams
|
|
- RegisterDatasetRequest
|
|
- RegisterEvalTaskRequest
|
|
- RegisterMemoryBankRequest
|
|
- RegisterModelRequest
|
|
- RegisterScoringFunctionRequest
|
|
- RegisterShieldRequest
|
|
- RegisterToolGroupRequest
|
|
- ResponseFormat
|
|
- RouteInfo
|
|
- RunEvalRequest
|
|
- RunShieldRequest
|
|
- RunShieldResponse
|
|
- SafetyViolation
|
|
- SamplingParams
|
|
- SaveSpansToDatasetRequest
|
|
- ScoreBatchRequest
|
|
- ScoreBatchResponse
|
|
- ScoreRequest
|
|
- ScoreResponse
|
|
- ScoringFn
|
|
- ScoringResult
|
|
- Session
|
|
- Shield
|
|
- ShieldCallStep
|
|
- Span
|
|
- SpanEndPayload
|
|
- SpanStartPayload
|
|
- SpanStatus
|
|
- SpanWithStatus
|
|
- StopReason
|
|
- StructuredLogEvent
|
|
- SupervisedFineTuneRequest
|
|
- SyntheticDataGenerateRequest
|
|
- SyntheticDataGenerationResponse
|
|
- SystemMessage
|
|
- TextContentItem
|
|
- TokenLogProbs
|
|
- Tool
|
|
- ToolCall
|
|
- ToolCallDelta
|
|
- ToolCallParseStatus
|
|
- ToolChoice
|
|
- ToolDef
|
|
- ToolDefinition
|
|
- ToolExecutionStep
|
|
- ToolGroup
|
|
- ToolHost
|
|
- ToolInvocationResult
|
|
- ToolParamDefinition
|
|
- ToolParameter
|
|
- ToolPromptFormat
|
|
- ToolResponse
|
|
- ToolResponseMessage
|
|
- TopKSamplingStrategy
|
|
- TopPSamplingStrategy
|
|
- Trace
|
|
- TrainingConfig
|
|
- Turn
|
|
- URL
|
|
- UnregisterDatasetRequest
|
|
- UnregisterMemoryBankRequest
|
|
- UnregisterModelRequest
|
|
- UnregisterToolGroupRequest
|
|
- UnstructuredLogEvent
|
|
- UserMessage
|
|
- VectorMemoryBank
|
|
- VectorMemoryBankParams
|
|
- VersionInfo
|
|
- ViolationLevel
|