llama-stack/docs/resources/llama-stack-spec.yaml
Ashwin Bharambe ec4fc800cc
[API Updates] Model / shield / memory-bank routing + agent persistence + support for private headers (#92)
This is yet another of those large PRs (hopefully we will have fewer and fewer of them as things mature quickly). This one introduces substantial improvements and some simplifications to the stack.

Most important bits:

* The Agents reference implementation now supports session / turn persistence. The default implementation uses SQLite, but Redis is also supported.

* We have re-architected the structure of the Stack APIs to allow for more flexible routing. The motivating use cases are:
  - routing model A to ollama and model B to a remote provider like Together
  - routing shield A to a local implementation and shield B to a remote provider like Bedrock
  - routing a vector memory bank to Weaviate while routing a keyvalue memory bank to Redis

* Support for provider-specific parameters passed from clients. A client can pass data using the `x_llamastack_provider_data` parameter, which can be type-checked and provided to the Adapter implementations.
2024-09-23 14:22:22 -07:00

4307 lines
114 KiB
YAML

components:
responses: {}
schemas:
AgentConfig:
additionalProperties: false
properties:
enable_session_persistence:
type: boolean
input_shields:
items:
type: string
type: array
instructions:
type: string
max_infer_iters:
default: 10
type: integer
model:
type: string
output_shields:
items:
type: string
type: array
sampling_params:
$ref: '#/components/schemas/SamplingParams'
tool_choice:
$ref: '#/components/schemas/ToolChoice'
default: auto
tool_prompt_format:
$ref: '#/components/schemas/ToolPromptFormat'
default: json
tools:
items:
oneOf:
- $ref: '#/components/schemas/SearchToolDefinition'
- $ref: '#/components/schemas/WolframAlphaToolDefinition'
- $ref: '#/components/schemas/PhotogenToolDefinition'
- $ref: '#/components/schemas/CodeInterpreterToolDefinition'
- $ref: '#/components/schemas/FunctionCallToolDefinition'
- $ref: '#/components/schemas/MemoryToolDefinition'
type: array
required:
- max_infer_iters
- model
- instructions
- enable_session_persistence
type: object
AgentCreateResponse:
additionalProperties: false
properties:
agent_id:
type: string
required:
- agent_id
type: object
AgentSessionCreateResponse:
additionalProperties: false
properties:
session_id:
type: string
required:
- session_id
type: object
AgentStepResponse:
additionalProperties: false
properties:
step:
oneOf:
- $ref: '#/components/schemas/InferenceStep'
- $ref: '#/components/schemas/ToolExecutionStep'
- $ref: '#/components/schemas/ShieldCallStep'
- $ref: '#/components/schemas/MemoryRetrievalStep'
required:
- step
type: object
AgentTurnResponseEvent:
additionalProperties: false
properties:
payload:
oneOf:
- $ref: '#/components/schemas/AgentTurnResponseStepStartPayload'
- $ref: '#/components/schemas/AgentTurnResponseStepProgressPayload'
- $ref: '#/components/schemas/AgentTurnResponseStepCompletePayload'
- $ref: '#/components/schemas/AgentTurnResponseTurnStartPayload'
- $ref: '#/components/schemas/AgentTurnResponseTurnCompletePayload'
required:
- payload
title: Streamed agent execution response.
type: object
AgentTurnResponseStepCompletePayload:
additionalProperties: false
properties:
event_type:
const: step_complete
default: step_complete
type: string
step_details:
oneOf:
- $ref: '#/components/schemas/InferenceStep'
- $ref: '#/components/schemas/ToolExecutionStep'
- $ref: '#/components/schemas/ShieldCallStep'
- $ref: '#/components/schemas/MemoryRetrievalStep'
step_type:
enum:
- inference
- tool_execution
- shield_call
- memory_retrieval
type: string
required:
- event_type
- step_type
- step_details
type: object
AgentTurnResponseStepProgressPayload:
additionalProperties: false
properties:
event_type:
const: step_progress
default: step_progress
type: string
model_response_text_delta:
type: string
step_id:
type: string
step_type:
enum:
- inference
- tool_execution
- shield_call
- memory_retrieval
type: string
tool_call_delta:
$ref: '#/components/schemas/ToolCallDelta'
tool_response_text_delta:
type: string
required:
- event_type
- step_type
- step_id
type: object
AgentTurnResponseStepStartPayload:
additionalProperties: false
properties:
event_type:
const: step_start
default: step_start
type: string
metadata:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
step_id:
type: string
step_type:
enum:
- inference
- tool_execution
- shield_call
- memory_retrieval
type: string
required:
- event_type
- step_type
- step_id
type: object
AgentTurnResponseStreamChunk:
additionalProperties: false
properties:
event:
$ref: '#/components/schemas/AgentTurnResponseEvent'
required:
- event
type: object
AgentTurnResponseTurnCompletePayload:
additionalProperties: false
properties:
event_type:
const: turn_complete
default: turn_complete
type: string
turn:
$ref: '#/components/schemas/Turn'
required:
- event_type
- turn
type: object
AgentTurnResponseTurnStartPayload:
additionalProperties: false
properties:
event_type:
const: turn_start
default: turn_start
type: string
turn_id:
type: string
required:
- event_type
- turn_id
type: object
# Attachment object: `content` and `mime_type` are both required, and no other
# properties are allowed.
Attachment:
additionalProperties: false
properties:
content:
# Accepts a single string, an array of strings, or a URL reference.
# NOTE(review): the URL schema is defined outside this view. If it is itself a
# string schema, a plain string could satisfy both the `type: string` branch
# and the URL branch and therefore fail `oneOf` — confirm; `anyOf` may be
# the safer combinator.
oneOf:
- type: string
- items:
type: string
type: array
- $ref: '#/components/schemas/URL'
mime_type:
type: string
required:
- content
- mime_type
type: object
BatchChatCompletionRequest:
additionalProperties: false
properties:
logprobs:
additionalProperties: false
properties:
top_k:
default: 0
type: integer
type: object
messages_batch:
items:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
type: array
model:
type: string
sampling_params:
$ref: '#/components/schemas/SamplingParams'
tool_choice:
$ref: '#/components/schemas/ToolChoice'
tool_prompt_format:
$ref: '#/components/schemas/ToolPromptFormat'
tools:
items:
$ref: '#/components/schemas/ToolDefinition'
type: array
required:
- model
- messages_batch
type: object
BatchChatCompletionResponse:
additionalProperties: false
properties:
completion_message_batch:
items:
$ref: '#/components/schemas/CompletionMessage'
type: array
required:
- completion_message_batch
type: object
BatchCompletionRequest:
additionalProperties: false
properties:
content_batch:
items:
oneOf:
- type: string
- items:
type: string
type: array
type: array
logprobs:
additionalProperties: false
properties:
top_k:
default: 0
type: integer
type: object
model:
type: string
sampling_params:
$ref: '#/components/schemas/SamplingParams'
required:
- model
- content_batch
type: object
BatchCompletionResponse:
additionalProperties: false
properties:
completion_message_batch:
items:
$ref: '#/components/schemas/CompletionMessage'
type: array
required:
- completion_message_batch
type: object
BuiltinTool:
enum:
- brave_search
- wolfram_alpha
- photogen
- code_interpreter
type: string
CancelEvaluationJobRequest:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
CancelTrainingJobRequest:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
ChatCompletionRequest:
additionalProperties: false
properties:
logprobs:
additionalProperties: false
properties:
top_k:
default: 0
type: integer
type: object
messages:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
model:
type: string
sampling_params:
$ref: '#/components/schemas/SamplingParams'
stream:
type: boolean
tool_choice:
$ref: '#/components/schemas/ToolChoice'
tool_prompt_format:
$ref: '#/components/schemas/ToolPromptFormat'
tools:
items:
$ref: '#/components/schemas/ToolDefinition'
type: array
required:
- model
- messages
type: object
ChatCompletionResponse:
additionalProperties: false
properties:
completion_message:
$ref: '#/components/schemas/CompletionMessage'
logprobs:
items:
$ref: '#/components/schemas/TokenLogProbs'
type: array
required:
- completion_message
title: Chat completion response.
type: object
ChatCompletionResponseEvent:
additionalProperties: false
properties:
delta:
oneOf:
- type: string
- $ref: '#/components/schemas/ToolCallDelta'
event_type:
$ref: '#/components/schemas/ChatCompletionResponseEventType'
logprobs:
items:
$ref: '#/components/schemas/TokenLogProbs'
type: array
stop_reason:
$ref: '#/components/schemas/StopReason'
required:
- event_type
- delta
title: Chat completion response event.
type: object
ChatCompletionResponseEventType:
enum:
- start
- complete
- progress
type: string
ChatCompletionResponseStreamChunk:
additionalProperties: false
properties:
event:
$ref: '#/components/schemas/ChatCompletionResponseEvent'
required:
- event
title: SSE-stream of these events.
type: object
Checkpoint:
description: Checkpoint created during training runs
CodeInterpreterToolDefinition:
additionalProperties: false
properties:
enable_inline_code_execution:
default: true
type: boolean
input_shields:
items:
type: string
type: array
output_shields:
items:
type: string
type: array
remote_execution:
$ref: '#/components/schemas/RestAPIExecutionConfig'
type:
const: code_interpreter
default: code_interpreter
type: string
required:
- type
- enable_inline_code_execution
type: object
CompletionMessage:
additionalProperties: false
properties:
content:
oneOf:
- type: string
- items:
type: string
type: array
role:
const: assistant
default: assistant
type: string
stop_reason:
$ref: '#/components/schemas/StopReason'
tool_calls:
items:
$ref: '#/components/schemas/ToolCall'
type: array
required:
- role
- content
- stop_reason
- tool_calls
type: object
CompletionRequest:
additionalProperties: false
properties:
content:
oneOf:
- type: string
- items:
type: string
type: array
logprobs:
additionalProperties: false
properties:
top_k:
default: 0
type: integer
type: object
model:
type: string
sampling_params:
$ref: '#/components/schemas/SamplingParams'
stream:
type: boolean
required:
- model
- content
type: object
CompletionResponse:
additionalProperties: false
properties:
completion_message:
$ref: '#/components/schemas/CompletionMessage'
logprobs:
items:
$ref: '#/components/schemas/TokenLogProbs'
type: array
required:
- completion_message
title: Completion response.
type: object
# One chunk of a streamed completion response. `delta` is the only required
# field; `logprobs` and `stop_reason` are optional.
CompletionResponseStreamChunk:
  additionalProperties: false
  properties:
    delta:
      type: string
    logprobs:
      items:
        $ref: '#/components/schemas/TokenLogProbs'
      type: array
    stop_reason:
      $ref: '#/components/schemas/StopReason'
  required:
  - delta
  # Capitalized to match the sibling titles in this file
  # ("Completion response.", "Streamed agent execution response.").
  title: Streamed completion response.
  type: object
CreateAgentRequest:
additionalProperties: false
properties:
agent_config:
$ref: '#/components/schemas/AgentConfig'
required:
- agent_config
type: object
CreateAgentSessionRequest:
additionalProperties: false
properties:
agent_id:
type: string
session_name:
type: string
required:
- agent_id
- session_name
type: object
CreateAgentTurnRequest:
additionalProperties: false
properties:
agent_id:
type: string
attachments:
items:
$ref: '#/components/schemas/Attachment'
type: array
messages:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
type: array
session_id:
type: string
stream:
type: boolean
required:
- agent_id
- session_id
- messages
type: object
CreateDatasetRequest:
additionalProperties: false
properties:
dataset:
$ref: '#/components/schemas/TrainEvalDataset'
uuid:
type: string
required:
- uuid
- dataset
type: object
CreateMemoryBankRequest:
additionalProperties: false
properties:
config:
oneOf:
- additionalProperties: false
properties:
chunk_size_in_tokens:
type: integer
embedding_model:
type: string
overlap_size_in_tokens:
type: integer
type:
const: vector
default: vector
type: string
required:
- type
- embedding_model
- chunk_size_in_tokens
type: object
- additionalProperties: false
properties:
type:
const: keyvalue
default: keyvalue
type: string
required:
- type
type: object
- additionalProperties: false
properties:
type:
const: keyword
default: keyword
type: string
required:
- type
type: object
- additionalProperties: false
properties:
type:
const: graph
default: graph
type: string
required:
- type
type: object
name:
type: string
url:
$ref: '#/components/schemas/URL'
required:
- name
- config
type: object
DPOAlignmentConfig:
additionalProperties: false
properties:
epsilon:
type: number
gamma:
type: number
reward_clip:
type: number
reward_scale:
type: number
required:
- reward_scale
- reward_clip
- epsilon
- gamma
type: object
DeleteAgentsRequest:
additionalProperties: false
properties:
agent_id:
type: string
required:
- agent_id
type: object
DeleteAgentsSessionRequest:
additionalProperties: false
properties:
agent_id:
type: string
session_id:
type: string
required:
- agent_id
- session_id
type: object
DeleteDatasetRequest:
additionalProperties: false
properties:
dataset_uuid:
type: string
required:
- dataset_uuid
type: object
DeleteDocumentsRequest:
additionalProperties: false
properties:
bank_id:
type: string
document_ids:
items:
type: string
type: array
required:
- bank_id
- document_ids
type: object
DialogGenerations:
additionalProperties: false
properties:
dialog:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
sampled_generations:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
required:
- dialog
- sampled_generations
type: object
DoraFinetuningConfig:
additionalProperties: false
properties:
alpha:
type: integer
apply_lora_to_mlp:
type: boolean
apply_lora_to_output:
type: boolean
lora_attn_modules:
items:
type: string
type: array
rank:
type: integer
required:
- lora_attn_modules
- apply_lora_to_mlp
- apply_lora_to_output
- rank
- alpha
type: object
DropMemoryBankRequest:
additionalProperties: false
properties:
bank_id:
type: string
required:
- bank_id
type: object
EmbeddingsRequest:
additionalProperties: false
properties:
contents:
items:
oneOf:
- type: string
- items:
type: string
type: array
type: array
model:
type: string
required:
- model
- contents
type: object
EmbeddingsResponse:
additionalProperties: false
properties:
embeddings:
items:
items:
type: number
type: array
type: array
required:
- embeddings
type: object
EvaluateQuestionAnsweringRequest:
additionalProperties: false
properties:
metrics:
items:
enum:
- em
- f1
type: string
type: array
required:
- metrics
type: object
EvaluateSummarizationRequest:
additionalProperties: false
properties:
metrics:
items:
enum:
- rouge
- bleu
type: string
type: array
required:
- metrics
type: object
EvaluateTextGenerationRequest:
additionalProperties: false
properties:
metrics:
items:
enum:
- perplexity
- rouge
- bleu
type: string
type: array
required:
- metrics
type: object
EvaluationJob:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
# Artifacts response for an evaluation job. Only `job_uuid` is declared; this
# schema defines no artifact payload fields.
EvaluationJobArtifactsResponse:
  additionalProperties: false
  properties:
    job_uuid:
      type: string
  required:
  - job_uuid
  # Grammar fix: "a evaluation job" -> "an evaluation job".
  title: Artifacts of an evaluation job.
  type: object
EvaluationJobLogStream:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
EvaluationJobStatusResponse:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
FinetuningAlgorithm:
enum:
- full
- lora
- qlora
- dora
type: string
FunctionCallToolDefinition:
additionalProperties: false
properties:
description:
type: string
function_name:
type: string
input_shields:
items:
type: string
type: array
output_shields:
items:
type: string
type: array
parameters:
additionalProperties:
$ref: '#/components/schemas/ToolParamDefinition'
type: object
remote_execution:
$ref: '#/components/schemas/RestAPIExecutionConfig'
type:
const: function_call
default: function_call
type: string
required:
- type
- function_name
- description
- parameters
type: object
GetAgentsSessionRequest:
additionalProperties: false
properties:
turn_ids:
items:
type: string
type: array
type: object
GetDocumentsRequest:
additionalProperties: false
properties:
document_ids:
items:
type: string
type: array
required:
- document_ids
type: object
InferenceStep:
additionalProperties: false
properties:
completed_at:
format: date-time
type: string
model_response:
$ref: '#/components/schemas/CompletionMessage'
started_at:
format: date-time
type: string
step_id:
type: string
step_type:
const: inference
default: inference
type: string
turn_id:
type: string
required:
- turn_id
- step_id
- step_type
- model_response
type: object
InsertDocumentsRequest:
additionalProperties: false
properties:
bank_id:
type: string
documents:
items:
$ref: '#/components/schemas/MemoryBankDocument'
type: array
ttl_seconds:
type: integer
required:
- bank_id
- documents
type: object
LogEventRequest:
additionalProperties: false
properties:
event:
oneOf:
- $ref: '#/components/schemas/UnstructuredLogEvent'
- $ref: '#/components/schemas/MetricEvent'
- $ref: '#/components/schemas/StructuredLogEvent'
required:
- event
type: object
LogSeverity:
enum:
- verbose
- debug
- info
- warn
- error
- critical
type: string
LoraFinetuningConfig:
additionalProperties: false
properties:
alpha:
type: integer
apply_lora_to_mlp:
type: boolean
apply_lora_to_output:
type: boolean
lora_attn_modules:
items:
type: string
type: array
rank:
type: integer
required:
- lora_attn_modules
- apply_lora_to_mlp
- apply_lora_to_output
- rank
- alpha
type: object
MemoryBank:
additionalProperties: false
properties:
bank_id:
type: string
config:
oneOf:
- additionalProperties: false
properties:
chunk_size_in_tokens:
type: integer
embedding_model:
type: string
overlap_size_in_tokens:
type: integer
type:
const: vector
default: vector
type: string
required:
- type
- embedding_model
- chunk_size_in_tokens
type: object
- additionalProperties: false
properties:
type:
const: keyvalue
default: keyvalue
type: string
required:
- type
type: object
- additionalProperties: false
properties:
type:
const: keyword
default: keyword
type: string
required:
- type
type: object
- additionalProperties: false
properties:
type:
const: graph
default: graph
type: string
required:
- type
type: object
name:
type: string
url:
$ref: '#/components/schemas/URL'
required:
- bank_id
- name
- config
type: object
# Document stored in a memory bank. `document_id`, `content` and `metadata` are
# required; `mime_type` is optional.
MemoryBankDocument:
additionalProperties: false
properties:
content:
# Accepts a single string, an array of strings, or a URL reference.
# NOTE(review): the URL schema is defined outside this view. If it is itself a
# string schema, a plain string could satisfy both the `type: string` branch
# and the URL branch and therefore fail `oneOf` — confirm; `anyOf` may be
# the safer combinator.
oneOf:
- type: string
- items:
type: string
type: array
- $ref: '#/components/schemas/URL'
document_id:
type: string
metadata:
# Free-form map: each value may be null, boolean, number, string, array or
# object. These six types are mutually exclusive, so `oneOf` is safe here.
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
mime_type:
type: string
required:
- document_id
- content
- metadata
type: object
MemoryBankSpec:
additionalProperties: false
properties:
bank_type:
$ref: '#/components/schemas/MemoryBankType'
provider_config:
additionalProperties: false
properties:
config:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
provider_id:
type: string
required:
- provider_id
- config
type: object
required:
- bank_type
- provider_config
type: object
MemoryBankType:
enum:
- vector
- keyvalue
- keyword
- graph
type: string
MemoryRetrievalStep:
additionalProperties: false
properties:
completed_at:
format: date-time
type: string
inserted_context:
oneOf:
- type: string
- items:
type: string
type: array
memory_bank_ids:
items:
type: string
type: array
started_at:
format: date-time
type: string
step_id:
type: string
step_type:
const: memory_retrieval
default: memory_retrieval
type: string
turn_id:
type: string
required:
- turn_id
- step_id
- step_type
- memory_bank_ids
- inserted_context
type: object
MemoryToolDefinition:
additionalProperties: false
properties:
input_shields:
items:
type: string
type: array
max_chunks:
default: 10
type: integer
max_tokens_in_context:
default: 4096
type: integer
memory_bank_configs:
items:
oneOf:
- additionalProperties: false
properties:
bank_id:
type: string
type:
const: vector
default: vector
type: string
required:
- bank_id
- type
type: object
- additionalProperties: false
properties:
bank_id:
type: string
keys:
items:
type: string
type: array
type:
const: keyvalue
default: keyvalue
type: string
required:
- bank_id
- type
- keys
type: object
- additionalProperties: false
properties:
bank_id:
type: string
type:
const: keyword
default: keyword
type: string
required:
- bank_id
- type
type: object
- additionalProperties: false
properties:
bank_id:
type: string
entities:
items:
type: string
type: array
type:
const: graph
default: graph
type: string
required:
- bank_id
- type
- entities
type: object
type: array
output_shields:
items:
type: string
type: array
query_generator_config:
oneOf:
- additionalProperties: false
properties:
sep:
default: ' '
type: string
type:
const: default
default: default
type: string
required:
- type
- sep
type: object
- additionalProperties: false
properties:
model:
type: string
template:
type: string
type:
const: llm
default: llm
type: string
required:
- type
- model
- template
type: object
- additionalProperties: false
properties:
type:
const: custom
default: custom
type: string
required:
- type
type: object
type:
const: memory
default: memory
type: string
required:
- type
- memory_bank_configs
- query_generator_config
- max_tokens_in_context
- max_chunks
type: object
# Log event carrying one metric sample, tagged with the constant
# `type: metric`. Every property except `attributes` is required.
MetricEvent:
  additionalProperties: false
  properties:
    attributes:
      # Free-form map: each value may be any JSON type. The six listed types
      # are mutually exclusive, so `oneOf` is safe here.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
      type: object
    metric:
      type: string
    span_id:
      type: string
    timestamp:
      format: date-time
      type: string
    trace_id:
      type: string
    type:
      const: metric
      default: metric
      type: string
    unit:
      type: string
    value:
      # `anyOf`, not `oneOf`: every integer also satisfies `type: number`, so
      # `oneOf` (exactly one branch must match) would reject all whole-number
      # metric values.
      anyOf:
      - type: integer
      - type: number
  required:
  - trace_id
  - span_id
  - timestamp
  - type
  - metric
  - value
  - unit
  type: object
# Model descriptor. The schema declares only a description and places no type
# or property constraints on the value.
Model:
  description: >-
    The model family and SKU of the model along with other parameters
    corresponding to the model.
ModelServingSpec:
additionalProperties: false
properties:
llama_model:
$ref: '#/components/schemas/Model'
provider_config:
additionalProperties: false
properties:
config:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
provider_id:
type: string
required:
- provider_id
- config
type: object
required:
- llama_model
- provider_config
type: object
OptimizerConfig:
additionalProperties: false
properties:
lr:
type: number
lr_min:
type: number
optimizer_type:
enum:
- adam
- adamw
- sgd
type: string
weight_decay:
type: number
required:
- optimizer_type
- lr
- lr_min
- weight_decay
type: object
PhotogenToolDefinition:
additionalProperties: false
properties:
input_shields:
items:
type: string
type: array
output_shields:
items:
type: string
type: array
remote_execution:
$ref: '#/components/schemas/RestAPIExecutionConfig'
type:
const: photogen
default: photogen
type: string
required:
- type
type: object
PostTrainingJob:
additionalProperties: false
properties:
job_uuid:
type: string
required:
- job_uuid
type: object
PostTrainingJobArtifactsResponse:
additionalProperties: false
properties:
checkpoints:
items:
$ref: '#/components/schemas/Checkpoint'
type: array
job_uuid:
type: string
required:
- job_uuid
- checkpoints
title: Artifacts of a finetuning job.
type: object
PostTrainingJobLogStream:
additionalProperties: false
properties:
job_uuid:
type: string
log_lines:
items:
type: string
type: array
required:
- job_uuid
- log_lines
title: Stream of logs from a finetuning job.
type: object
PostTrainingJobStatus:
enum:
- running
- completed
- failed
- scheduled
type: string
PostTrainingJobStatusResponse:
additionalProperties: false
properties:
checkpoints:
items:
$ref: '#/components/schemas/Checkpoint'
type: array
completed_at:
format: date-time
type: string
job_uuid:
type: string
resources_allocated:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
scheduled_at:
format: date-time
type: string
started_at:
format: date-time
type: string
status:
$ref: '#/components/schemas/PostTrainingJobStatus'
required:
- job_uuid
- status
- checkpoints
title: Status of a finetuning job.
type: object
PreferenceOptimizeRequest:
additionalProperties: false
properties:
algorithm:
$ref: '#/components/schemas/RLHFAlgorithm'
algorithm_config:
$ref: '#/components/schemas/DPOAlignmentConfig'
dataset:
$ref: '#/components/schemas/TrainEvalDataset'
finetuned_model:
$ref: '#/components/schemas/URL'
hyperparam_search_config:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
job_uuid:
type: string
logger_config:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
optimizer_config:
$ref: '#/components/schemas/OptimizerConfig'
training_config:
$ref: '#/components/schemas/TrainingConfig'
validation_dataset:
$ref: '#/components/schemas/TrainEvalDataset'
required:
- job_uuid
- finetuned_model
- dataset
- validation_dataset
- algorithm
- algorithm_config
- optimizer_config
- training_config
- hyperparam_search_config
- logger_config
type: object
QLoraFinetuningConfig:
additionalProperties: false
properties:
alpha:
type: integer
apply_lora_to_mlp:
type: boolean
apply_lora_to_output:
type: boolean
lora_attn_modules:
items:
type: string
type: array
rank:
type: integer
required:
- lora_attn_modules
- apply_lora_to_mlp
- apply_lora_to_output
- rank
- alpha
type: object
QueryDocumentsRequest:
additionalProperties: false
properties:
bank_id:
type: string
params:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
query:
oneOf:
- type: string
- items:
type: string
type: array
required:
- bank_id
- query
type: object
QueryDocumentsResponse:
additionalProperties: false
properties:
chunks:
items:
additionalProperties: false
properties:
content:
oneOf:
- type: string
- items:
type: string
type: array
document_id:
type: string
token_count:
type: integer
required:
- content
- token_count
- document_id
type: object
type: array
scores:
items:
type: number
type: array
required:
- chunks
- scores
type: object
RLHFAlgorithm:
enum:
- dpo
type: string
RestAPIExecutionConfig:
additionalProperties: false
properties:
body:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
headers:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
method:
$ref: '#/components/schemas/RestAPIMethod'
params:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
url:
$ref: '#/components/schemas/URL'
required:
- url
- method
type: object
RestAPIMethod:
enum:
- GET
- POST
- PUT
- DELETE
type: string
RewardScoreRequest:
additionalProperties: false
properties:
dialog_generations:
items:
$ref: '#/components/schemas/DialogGenerations'
type: array
model:
type: string
required:
- dialog_generations
- model
type: object
# Reward-scoring response: a required array of ScoredDialogGenerations entries.
RewardScoringResponse:
  type: object
  title: >-
    Response from the reward scoring. Batch of (prompt, response, score)
    tuples that pass the threshold.
  additionalProperties: false
  required:
  - scored_generations
  properties:
    scored_generations:
      type: array
      items:
        $ref: '#/components/schemas/ScoredDialogGenerations'
RunShieldRequest:
additionalProperties: false
properties:
messages:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
params:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
shield_type:
type: string
required:
- shield_type
- messages
- params
type: object
RunShieldResponse:
additionalProperties: false
properties:
violation:
$ref: '#/components/schemas/SafetyViolation'
type: object
SafetyViolation:
additionalProperties: false
properties:
metadata:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
user_message:
type: string
violation_level:
$ref: '#/components/schemas/ViolationLevel'
required:
- violation_level
- metadata
type: object
SamplingParams:
additionalProperties: false
properties:
max_tokens:
default: 0
type: integer
repetition_penalty:
default: 1.0
type: number
strategy:
$ref: '#/components/schemas/SamplingStrategy'
default: greedy
temperature:
default: 0.0
type: number
top_k:
default: 0
type: integer
top_p:
default: 0.95
type: number
required:
- strategy
type: object
SamplingStrategy:
enum:
- greedy
- top_p
- top_k
type: string
ScoredDialogGenerations:
additionalProperties: false
properties:
dialog:
items:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
type: array
scored_generations:
items:
$ref: '#/components/schemas/ScoredMessage'
type: array
required:
- dialog
- scored_generations
type: object
ScoredMessage:
additionalProperties: false
properties:
message:
oneOf:
- $ref: '#/components/schemas/UserMessage'
- $ref: '#/components/schemas/SystemMessage'
- $ref: '#/components/schemas/ToolResponseMessage'
- $ref: '#/components/schemas/CompletionMessage'
score:
type: number
required:
- message
- score
type: object
# Tool definition for web search. `type`, `api_key` and `engine` are required;
# the shield lists and `remote_execution` are optional.
SearchToolDefinition:
additionalProperties: false
properties:
api_key:
type: string
engine:
# Search backend selector; defaults to `brave`.
default: brave
enum:
- bing
- brave
type: string
input_shields:
items:
type: string
type: array
output_shields:
items:
type: string
type: array
remote_execution:
$ref: '#/components/schemas/RestAPIExecutionConfig'
type:
# NOTE(review): the tag is fixed to `brave_search` even when `engine` is
# `bing`; presumably kept to line up with the `brave_search` entry in
# BuiltinTool — confirm before renaming.
const: brave_search
default: brave_search
type: string
required:
- type
- api_key
- engine
type: object
Session:
additionalProperties: false
properties:
memory_bank:
$ref: '#/components/schemas/MemoryBank'
session_id:
type: string
session_name:
type: string
started_at:
format: date-time
type: string
turns:
items:
$ref: '#/components/schemas/Turn'
type: array
required:
- session_id
- session_name
- turns
- started_at
title: A single session of an interaction with an Agentic System.
type: object
ShieldCallStep:
additionalProperties: false
properties:
completed_at:
format: date-time
type: string
started_at:
format: date-time
type: string
step_id:
type: string
step_type:
const: shield_call
default: shield_call
type: string
turn_id:
type: string
violation:
$ref: '#/components/schemas/SafetyViolation'
required:
- turn_id
- step_id
- step_type
type: object
ShieldSpec:
additionalProperties: false
properties:
provider_config:
additionalProperties: false
properties:
config:
additionalProperties:
oneOf:
- type: 'null'
- type: boolean
- type: number
- type: string
- type: array
- type: object
type: object
provider_id:
type: string
required:
- provider_id
- config
type: object
shield_type:
type: string
required:
- shield_type
- provider_config
type: object
SpanEndPayload:
additionalProperties: false
properties:
status:
$ref: '#/components/schemas/SpanStatus'
type:
const: span_end
default: span_end
type: string
required:
- type
- status
type: object
SpanStartPayload:
additionalProperties: false
properties:
name:
type: string
parent_span_id:
type: string
type:
const: span_start
default: span_start
type: string
required:
- type
- name
type: object
# Allowed span status values.
SpanStatus:
  type: string
  enum: [ok, error]
# Allowed stop-reason values.
StopReason:
  type: string
  enum: [end_of_turn, end_of_message, out_of_tokens]
# Log event with `type` fixed to `structured_log`; its payload is either a
# SpanStartPayload or a SpanEndPayload. `attributes` is optional.
StructuredLogEvent:
  type: object
  additionalProperties: false
  required: [trace_id, span_id, timestamp, type, payload]
  properties:
    attributes:
      type: object
      # Values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
    payload:
      oneOf:
      - $ref: '#/components/schemas/SpanStartPayload'
      - $ref: '#/components/schemas/SpanEndPayload'
    span_id:
      type: string
    timestamp:
      type: string
      format: date-time
    trace_id:
      type: string
    type:
      type: string
      const: structured_log
      default: structured_log
# Request body in which every declared property is required.
# `algorithm_config` is one of the Lora / QLora / Dora configs.
SupervisedFineTuneRequest:
  type: object
  additionalProperties: false
  required:
  - job_uuid
  - model
  - dataset
  - validation_dataset
  - algorithm
  - algorithm_config
  - optimizer_config
  - training_config
  - hyperparam_search_config
  - logger_config
  properties:
    algorithm:
      $ref: '#/components/schemas/FinetuningAlgorithm'
    algorithm_config:
      oneOf:
      - $ref: '#/components/schemas/LoraFinetuningConfig'
      - $ref: '#/components/schemas/QLoraFinetuningConfig'
      - $ref: '#/components/schemas/DoraFinetuningConfig'
    dataset:
      $ref: '#/components/schemas/TrainEvalDataset'
    hyperparam_search_config:
      type: object
      # Free-form map; values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
    job_uuid:
      type: string
    logger_config:
      type: object
      # Free-form map; values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
    model:
      type: string
    optimizer_config:
      $ref: '#/components/schemas/OptimizerConfig'
    training_config:
      $ref: '#/components/schemas/TrainingConfig'
    validation_dataset:
      $ref: '#/components/schemas/TrainEvalDataset'
# Request body: a list of dialog messages plus a filtering function.
# `model` is optional.
SyntheticDataGenerateRequest:
  type: object
  additionalProperties: false
  required: [dialogs, filtering_function]
  properties:
    dialogs:
      type: array
      items:
        oneOf:
        - $ref: '#/components/schemas/UserMessage'
        - $ref: '#/components/schemas/SystemMessage'
        - $ref: '#/components/schemas/ToolResponseMessage'
        - $ref: '#/components/schemas/CompletionMessage'
    filtering_function:
      type: string
      title: The type of filtering function.
      enum:
      - none
      - random
      - top_k
      - top_p
      - top_k_top_p
      - sigmoid
    model:
      type: string
# Response body: required `synthetic_data` list and an optional free-form
# `statistics` map.
SyntheticDataGenerationResponse:
  type: object
  title: >-
    Response from the synthetic data generation. Batch of (prompt, response,
    score) tuples that pass the threshold.
  additionalProperties: false
  required: [synthetic_data]
  properties:
    statistics:
      type: object
      # Values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
    synthetic_data:
      type: array
      items:
        $ref: '#/components/schemas/ScoredDialogGenerations'
# Message with `role` fixed to `system`; `content` is a string or a list of
# strings.
SystemMessage:
  type: object
  additionalProperties: false
  required: [role, content]
  properties:
    content:
      oneOf:
      - type: string
      - type: array
        items:
          type: string
    role:
      type: string
      const: system
      default: system
# Wrapper around `logprobs_by_token`, a map from string keys to numbers.
TokenLogProbs:
  type: object
  additionalProperties: false
  required: [logprobs_by_token]
  properties:
    logprobs_by_token:
      type: object
      additionalProperties:
        type: number
# A tool invocation: `call_id`, `tool_name` and an `arguments` object whose
# values are scalars, lists of scalars, or one-level maps of scalars.
ToolCall:
  type: object
  additionalProperties: false
  required:
  - call_id
  - tool_name
  - arguments
  properties:
    arguments:
      type: object
      additionalProperties:
        # anyOf rather than oneOf: every integer is also a valid `number`, so
        # under oneOf ("exactly one branch matches") an argument such as 5
        # matched two branches and was rejected by strict validators.
        anyOf:
        - type: string
        - type: integer
        - type: number
        - type: boolean
        - type: 'null'
        - type: array
          items:
            anyOf:
            - type: string
            - type: integer
            - type: number
            - type: boolean
            - type: 'null'
        - type: object
          additionalProperties:
            anyOf:
            - type: string
            - type: integer
            - type: number
            - type: boolean
            - type: 'null'
    call_id:
      type: string
    tool_name:
      # anyOf for the same reason. NOTE(review): BuiltinTool is defined
      # outside this part of the file; if it is a string enum, a built-in
      # name matches both branches and oneOf would reject it. Confirm.
      anyOf:
      - $ref: '#/components/schemas/BuiltinTool'
      - type: string
# Delta whose `content` is either a raw string or a ToolCall, together with a
# parse status.
ToolCallDelta:
  type: object
  additionalProperties: false
  required: [content, parse_status]
  properties:
    content:
      oneOf:
      - type: string
      - $ref: '#/components/schemas/ToolCall'
    parse_status:
      $ref: '#/components/schemas/ToolCallParseStatus'
# Allowed parse-status values for a tool call.
ToolCallParseStatus:
  type: string
  enum: [started, in_progress, failure, success]
# Allowed tool-choice values.
ToolChoice:
  type: string
  enum: [auto, required]
# Describes a tool: required `tool_name`, optional `description`, and an
# optional map of parameter name to ToolParamDefinition.
ToolDefinition:
  type: object
  additionalProperties: false
  required:
  - tool_name
  properties:
    description:
      type: string
    parameters:
      type: object
      additionalProperties:
        $ref: '#/components/schemas/ToolParamDefinition'
    tool_name:
      # anyOf rather than oneOf: oneOf demands that exactly one branch match.
      # NOTE(review): BuiltinTool is defined outside this part of the file; if
      # it is a string enum, a built-in name matches both branches and oneOf
      # would reject it. anyOf accepts everything oneOf did. Confirm.
      anyOf:
      - $ref: '#/components/schemas/BuiltinTool'
      - type: string
# Step record with `step_type` fixed to `tool_execution`, listing the tool
# calls made and the responses received. Timestamps are optional.
ToolExecutionStep:
  type: object
  additionalProperties: false
  required: [turn_id, step_id, step_type, tool_calls, tool_responses]
  properties:
    completed_at:
      type: string
      format: date-time
    started_at:
      type: string
      format: date-time
    step_id:
      type: string
    step_type:
      type: string
      const: tool_execution
      default: tool_execution
    tool_calls:
      type: array
      items:
        $ref: '#/components/schemas/ToolCall'
    tool_responses:
      type: array
      items:
        $ref: '#/components/schemas/ToolResponse'
    turn_id:
      type: string
# One tool parameter. Only `param_type` is mandatory; the boolean property
# named `required` defaults to true.
ToolParamDefinition:
  type: object
  additionalProperties: false
  required: [param_type]
  properties:
    description:
      type: string
    param_type:
      type: string
    required:
      type: boolean
      default: true
# String enum naming the prompt format used when calling custom tools:
# `json` or `function_tag`. Both formats are explained in `description`,
# which is stored as an escaped double-quoted scalar with embedded newlines.
ToolPromptFormat:
description: "`json` --\n Refers to the json format for calling tools.\n\
\ The json format takes the form like\n {\n \"type\": \"function\"\
,\n \"function\" : {\n \"name\": \"function_name\",\n \
\ \"description\": \"function_description\",\n \"parameters\"\
: {...}\n }\n }\n\n`function_tag` --\n This is an example of\
\ how you could define\n your own user defined format for making tool calls.\n\
\ The function_tag format looks like this,\n <function=function_name>(parameters)</function>\n\
\nThe detailed prompts for each of these formats are added to llama cli"
enum:
- json
- function_tag
title: This Enum refers to the prompt format for calling custom / zero shot
tools
type: string
# Result of a tool call: the originating `call_id`, the tool's name and the
# content (a string or a list of strings).
ToolResponse:
  type: object
  additionalProperties: false
  required:
  - call_id
  - tool_name
  - content
  properties:
    call_id:
      type: string
    content:
      oneOf:
      - type: string
      - type: array
        items:
          type: string
    tool_name:
      # anyOf rather than oneOf: oneOf demands that exactly one branch match.
      # NOTE(review): BuiltinTool is defined outside this part of the file; if
      # it is a string enum, a built-in name matches both branches and oneOf
      # would reject it. anyOf accepts everything oneOf did. Confirm.
      anyOf:
      - $ref: '#/components/schemas/BuiltinTool'
      - type: string
# Message with `role` fixed to `ipython`, carrying a tool's output back under
# the originating `call_id`.
ToolResponseMessage:
  type: object
  additionalProperties: false
  required:
  - role
  - call_id
  - tool_name
  - content
  properties:
    call_id:
      type: string
    content:
      oneOf:
      - type: string
      - type: array
        items:
          type: string
    role:
      type: string
      const: ipython
      default: ipython
    tool_name:
      # anyOf rather than oneOf: oneOf demands that exactly one branch match.
      # NOTE(review): BuiltinTool is defined outside this part of the file; if
      # it is a string enum, a built-in name matches both branches and oneOf
      # would reject it. anyOf accepts everything oneOf did. Confirm.
      anyOf:
      - $ref: '#/components/schemas/BuiltinTool'
      - type: string
# Trace record: id, root span id and start time are required; `end_time` is
# optional.
Trace:
  type: object
  additionalProperties: false
  required: [trace_id, root_span_id, start_time]
  properties:
    end_time:
      type: string
      format: date-time
    root_span_id:
      type: string
    start_time:
      type: string
      format: date-time
    trace_id:
      type: string
# Dataset descriptor: a map of column name to column type plus a content URL.
# `metadata` is an optional free-form map.
TrainEvalDataset:
  type: object
  title: Dataset to be used for training or evaluating language models.
  additionalProperties: false
  required: [columns, content_url]
  properties:
    columns:
      type: object
      additionalProperties:
        $ref: '#/components/schemas/TrainEvalDatasetColumnType'
    content_url:
      $ref: '#/components/schemas/URL'
    metadata:
      type: object
      # Values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
# Allowed column types for a TrainEvalDataset.
TrainEvalDatasetColumnType:
  type: string
  enum: [dialog, text, media, number, json]
# Training settings; all seven properties are required.
TrainingConfig:
  type: object
  additionalProperties: false
  required:
  - n_epochs
  - batch_size
  - shuffle
  - n_iters
  - enable_activation_checkpointing
  - memory_efficient_fsdp_wrap
  - fsdp_cpu_offload
  properties:
    batch_size:
      type: integer
    enable_activation_checkpointing:
      type: boolean
    fsdp_cpu_offload:
      type: boolean
    memory_efficient_fsdp_wrap:
      type: boolean
    n_epochs:
      type: integer
    n_iters:
      type: integer
    shuffle:
      type: boolean
# A turn record: input messages, the steps taken, the output message and
# attachments. Only `completed_at` is optional.
Turn:
  type: object
  title: A single turn in an interaction with an Agentic System.
  additionalProperties: false
  required:
  - turn_id
  - session_id
  - input_messages
  - steps
  - output_message
  - output_attachments
  - started_at
  properties:
    completed_at:
      type: string
      format: date-time
    input_messages:
      type: array
      items:
        oneOf:
        - $ref: '#/components/schemas/UserMessage'
        - $ref: '#/components/schemas/ToolResponseMessage'
    output_attachments:
      type: array
      items:
        $ref: '#/components/schemas/Attachment'
    output_message:
      $ref: '#/components/schemas/CompletionMessage'
    session_id:
      type: string
    started_at:
      type: string
      format: date-time
    steps:
      type: array
      items:
        oneOf:
        - $ref: '#/components/schemas/InferenceStep'
        - $ref: '#/components/schemas/ToolExecutionStep'
        - $ref: '#/components/schemas/ShieldCallStep'
        - $ref: '#/components/schemas/MemoryRetrievalStep'
    turn_id:
      type: string
# URI string that must start with http://, https://, file:// or data:.
URL:
  type: string
  format: uri
  pattern: '^(https?://|file://|data:)'
# Log event with `type` fixed to `unstructured_log`: a message and severity
# tied to a trace/span. `attributes` is optional.
UnstructuredLogEvent:
  type: object
  additionalProperties: false
  required: [trace_id, span_id, timestamp, type, message, severity]
  properties:
    attributes:
      type: object
      # Values may be any JSON type.
      additionalProperties:
        oneOf:
        - type: 'null'
        - type: boolean
        - type: number
        - type: string
        - type: array
        - type: object
    message:
      type: string
    severity:
      $ref: '#/components/schemas/LogSeverity'
    span_id:
      type: string
    timestamp:
      type: string
      format: date-time
    trace_id:
      type: string
    type:
      type: string
      const: unstructured_log
      default: unstructured_log
# Request body: a bank id plus the list of MemoryBankDocument entries.
UpdateDocumentsRequest:
  type: object
  additionalProperties: false
  required: [bank_id, documents]
  properties:
    bank_id:
      type: string
    documents:
      type: array
      items:
        $ref: '#/components/schemas/MemoryBankDocument'
# Message with `role` fixed to `user`. `content` (required) and `context`
# (optional) are each a string or a list of strings.
UserMessage:
  type: object
  additionalProperties: false
  required: [role, content]
  properties:
    content:
      oneOf:
      - type: string
      - type: array
        items:
          type: string
    context:
      oneOf:
      - type: string
      - type: array
        items:
          type: string
    role:
      type: string
      const: user
      default: user
# Allowed violation-level values.
ViolationLevel:
  type: string
  enum: [info, warn, error]
# Tool definition whose `type` is pinned to `wolfram_alpha`; requires an
# `api_key`. Shield lists and `remote_execution` are optional.
WolframAlphaToolDefinition:
  type: object
  additionalProperties: false
  required: [type, api_key]
  properties:
    api_key:
      type: string
    input_shields:
      type: array
      items:
        type: string
    output_shields:
      type: array
      items:
        type: string
    remote_execution:
      $ref: '#/components/schemas/RestAPIExecutionConfig'
    type:
      type: string
      const: wolfram_alpha
      default: wolfram_alpha
# Document metadata: title, version and a free-text description. The
# description is an escaped double-quoted scalar and embeds the timestamp at
# which the spec was generated.
info:
description: "This is the specification of the llama stack that provides\n \
\ a set of endpoints and their corresponding interfaces that are tailored\
\ to\n best leverage Llama Models. The specification is still in\
\ draft and subject to change.\n Generated at 2024-09-23 10:56:42.866760"
title: '[DRAFT] Llama Stack Specification'
version: 0.0.1
# Default JSON Schema dialect for the schemas in this document, and the
# OpenAPI version the document is written against (quoted so both stay strings).
jsonSchemaDialect: 'https://json-schema.org/draft/2020-12/schema'
openapi: '3.1.0'
paths:
# POST: required JSON body CreateAgentRequest; 200 returns AgentCreateResponse.
/agents/create:
  post:
    tags: [Agents]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CreateAgentRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AgentCreateResponse'
# POST: required JSON body DeleteAgentsRequest; the 200 response declares no
# content.
/agents/delete:
  post:
    tags: [Agents]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/DeleteAgentsRequest'
    responses:
      '200':
        description: OK
# POST: required JSON body CreateAgentSessionRequest; 200 returns
# AgentSessionCreateResponse.
/agents/session/create:
  post:
    tags: [Agents]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CreateAgentSessionRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AgentSessionCreateResponse'
# POST: required JSON body DeleteAgentsSessionRequest; the 200 response
# declares no content.
/agents/session/delete:
  post:
    tags: [Agents]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/DeleteAgentsSessionRequest'
    responses:
      '200':
        description: OK
# POST: query parameters agent_id and session_id plus a required JSON body
# GetAgentsSessionRequest; 200 returns Session.
# NOTE(review): a read-style operation that mixes query parameters with a
# request body. Confirm the split is intended.
/agents/session/get:
  post:
    tags: [Agents]
    parameters:
    - name: agent_id
      in: query
      required: true
      schema: {type: string}
    - name: session_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/GetAgentsSessionRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/Session'
# GET: required query parameters agent_id, turn_id and step_id; 200 returns
# AgentStepResponse.
/agents/step/get:
  get:
    tags: [Agents]
    parameters:
    - name: agent_id
      in: query
      required: true
      schema: {type: string}
    - name: turn_id
      in: query
      required: true
      schema: {type: string}
    - name: step_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AgentStepResponse'
# POST: required JSON body CreateAgentTurnRequest; 200 returns
# AgentTurnResponseStreamChunk.
# NOTE(review): the response schema is named "StreamChunk" but is declared as
# application/json. Confirm whether this endpoint streams.
/agents/turn/create:
  post:
    tags: [Agents]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CreateAgentTurnRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AgentTurnResponseStreamChunk'
# GET: required query parameters agent_id and turn_id; 200 returns Turn.
/agents/turn/get:
  get:
    tags: [Agents]
    parameters:
    - name: agent_id
      in: query
      required: true
      schema: {type: string}
    - name: turn_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/Turn'
# POST: required JSON body BatchChatCompletionRequest; 200 returns
# BatchChatCompletionResponse.
/batch_inference/chat_completion:
  post:
    tags: [BatchInference]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/BatchChatCompletionRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/BatchChatCompletionResponse'
# POST: required JSON body BatchCompletionRequest; 200 returns
# BatchCompletionResponse.
/batch_inference/completion:
  post:
    tags: [BatchInference]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/BatchCompletionRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/BatchCompletionResponse'
# POST: required JSON body CreateDatasetRequest; the 200 response declares no
# content.
/datasets/create:
  post:
    tags: [Datasets]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CreateDatasetRequest'
    responses:
      '200':
        description: OK
# POST: required JSON body DeleteDatasetRequest; the 200 response declares no
# content.
/datasets/delete:
  post:
    tags: [Datasets]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/DeleteDatasetRequest'
    responses:
      '200':
        description: OK
# GET: required query parameter dataset_uuid; 200 returns TrainEvalDataset.
/datasets/get:
  get:
    tags: [Datasets]
    parameters:
    - name: dataset_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/TrainEvalDataset'
# GET: required query parameter job_uuid; 200 returns
# EvaluationJobArtifactsResponse.
/evaluate/job/artifacts:
  get:
    tags: [Evaluations]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJobArtifactsResponse'
# POST: required JSON body CancelEvaluationJobRequest; the 200 response
# declares no content.
/evaluate/job/cancel:
  post:
    tags: [Evaluations]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CancelEvaluationJobRequest'
    responses:
      '200':
        description: OK
# GET: required query parameter job_uuid; 200 returns EvaluationJobLogStream.
/evaluate/job/logs:
  get:
    tags: [Evaluations]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJobLogStream'
# GET: required query parameter job_uuid; 200 returns
# EvaluationJobStatusResponse.
/evaluate/job/status:
  get:
    tags: [Evaluations]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJobStatusResponse'
# GET with no query parameters; 200 is declared as application/jsonl with
# EvaluationJob as the schema.
/evaluate/jobs:
  get:
    tags: [Evaluations]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/EvaluationJob'
# POST: required JSON body EvaluateQuestionAnsweringRequest; 200 returns
# EvaluationJob.
/evaluate/question_answering/:
  post:
    tags: [Evaluations]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/EvaluateQuestionAnsweringRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJob'
# POST: required JSON body EvaluateSummarizationRequest; 200 returns
# EvaluationJob.
/evaluate/summarization/:
  post:
    tags: [Evaluations]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/EvaluateSummarizationRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJob'
# POST: required JSON body EvaluateTextGenerationRequest; 200 returns
# EvaluationJob.
/evaluate/text_generation/:
  post:
    tags: [Evaluations]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/EvaluateTextGenerationRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EvaluationJob'
# POST: required JSON body ChatCompletionRequest. The 200 response is either a
# complete ChatCompletionResponse or an SSE stream of
# ChatCompletionResponseStreamChunk events.
/inference/chat_completion:
  post:
    tags:
    - Inference
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema:
        type: string
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/ChatCompletionRequest'
    responses:
      '200':
        description: Chat completion response. **OR** SSE-stream of these events.
        content:
          # One entry per media type instead of a single text/event-stream
          # entry whose oneOf mixed the complete response with stream chunks.
          # NOTE(review): assumes the non-streaming response is served as
          # application/json. Confirm against the server.
          application/json:
            schema:
              $ref: '#/components/schemas/ChatCompletionResponse'
          text/event-stream:
            schema:
              $ref: '#/components/schemas/ChatCompletionResponseStreamChunk'
# POST: required JSON body CompletionRequest. The 200 response is either a
# complete CompletionResponse or a stream of CompletionResponseStreamChunk.
/inference/completion:
  post:
    tags:
    - Inference
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema:
        type: string
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CompletionRequest'
    responses:
      '200':
        description: Completion response. **OR** streamed completion response.
        content:
          # One entry per media type instead of declaring the streamed chunk
          # under application/json.
          # NOTE(review): assumes the stream is delivered as
          # text/event-stream, as for /inference/chat_completion. Confirm
          # against the server.
          application/json:
            schema:
              $ref: '#/components/schemas/CompletionResponse'
          text/event-stream:
            schema:
              $ref: '#/components/schemas/CompletionResponseStreamChunk'
# POST: required JSON body EmbeddingsRequest; 200 returns EmbeddingsResponse.
/inference/embeddings:
  post:
    tags: [Inference]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/EmbeddingsRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/EmbeddingsResponse'
# POST: required JSON body CreateMemoryBankRequest; 200 returns MemoryBank.
/memory/create:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CreateMemoryBankRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/MemoryBank'
# POST: required JSON body DeleteDocumentsRequest; the 200 response declares
# no content.
/memory/documents/delete:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/DeleteDocumentsRequest'
    responses:
      '200':
        description: OK
# POST: query parameter bank_id plus a required JSON body GetDocumentsRequest;
# 200 is declared as application/jsonl with MemoryBankDocument as the schema.
/memory/documents/get:
  post:
    tags: [Memory]
    parameters:
    - name: bank_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/GetDocumentsRequest'
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/MemoryBankDocument'
# POST: required JSON body DropMemoryBankRequest; 200 returns a JSON string.
/memory/drop:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/DropMemoryBankRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema: {type: string}
# GET: required query parameter bank_id; 200 returns a MemoryBank or null.
/memory/get:
  get:
    tags: [Memory]
    parameters:
    - name: bank_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              oneOf:
              - $ref: '#/components/schemas/MemoryBank'
              - type: 'null'
# POST: required JSON body InsertDocumentsRequest; the 200 response declares
# no content.
/memory/insert:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/InsertDocumentsRequest'
    responses:
      '200':
        description: OK
# GET with no query parameters; 200 is declared as application/jsonl with
# MemoryBank as the schema.
/memory/list:
  get:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/MemoryBank'
# POST: required JSON body QueryDocumentsRequest; 200 returns
# QueryDocumentsResponse.
/memory/query:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/QueryDocumentsRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/QueryDocumentsResponse'
# POST: required JSON body UpdateDocumentsRequest; the 200 response declares
# no content.
/memory/update:
  post:
    tags: [Memory]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/UpdateDocumentsRequest'
    responses:
      '200':
        description: OK
# GET: required query parameter bank_type (a MemoryBankType); 200 returns a
# MemoryBankSpec or null.
/memory_banks/get:
  get:
    tags: [MemoryBanks]
    parameters:
    - name: bank_type
      in: query
      required: true
      schema:
        $ref: '#/components/schemas/MemoryBankType'
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              oneOf:
              - $ref: '#/components/schemas/MemoryBankSpec'
              - type: 'null'
# GET with no query parameters; 200 is declared as application/jsonl with
# MemoryBankSpec as the schema.
/memory_banks/list:
  get:
    tags: [MemoryBanks]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/MemoryBankSpec'
# GET: required query parameter core_model_id; 200 returns a ModelServingSpec
# or null.
/models/get:
  get:
    tags: [Models]
    parameters:
    - name: core_model_id
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              oneOf:
              - $ref: '#/components/schemas/ModelServingSpec'
              - type: 'null'
# GET with no query parameters; 200 is declared as application/jsonl with
# ModelServingSpec as the schema.
/models/list:
  get:
    tags: [Models]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/ModelServingSpec'
# GET: required query parameter job_uuid; 200 returns
# PostTrainingJobArtifactsResponse.
/post_training/job/artifacts:
  get:
    tags: [PostTraining]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/PostTrainingJobArtifactsResponse'
# POST: required JSON body CancelTrainingJobRequest; the 200 response declares
# no content.
/post_training/job/cancel:
  post:
    tags: [PostTraining]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CancelTrainingJobRequest'
    responses:
      '200':
        description: OK
# GET: required query parameter job_uuid; 200 returns PostTrainingJobLogStream.
/post_training/job/logs:
  get:
    tags: [PostTraining]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/PostTrainingJobLogStream'
# GET: required query parameter job_uuid; 200 returns
# PostTrainingJobStatusResponse.
/post_training/job/status:
  get:
    tags: [PostTraining]
    parameters:
    - name: job_uuid
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/PostTrainingJobStatusResponse'
# GET with no query parameters; 200 is declared as application/jsonl with
# PostTrainingJob as the schema.
/post_training/jobs:
  get:
    tags: [PostTraining]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/PostTrainingJob'
# POST: required JSON body PreferenceOptimizeRequest; 200 returns
# PostTrainingJob.
/post_training/preference_optimize:
  post:
    tags: [PostTraining]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/PreferenceOptimizeRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/PostTrainingJob'
# POST: required JSON body SupervisedFineTuneRequest; 200 returns
# PostTrainingJob.
/post_training/supervised_fine_tune:
  post:
    tags: [PostTraining]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/SupervisedFineTuneRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/PostTrainingJob'
# POST: required JSON body RewardScoreRequest; 200 returns
# RewardScoringResponse.
/reward_scoring/score:
  post:
    tags: [RewardScoring]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/RewardScoreRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/RewardScoringResponse'
# POST: required JSON body RunShieldRequest; 200 returns RunShieldResponse.
/safety/run_shield:
  post:
    tags: [Safety]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/RunShieldRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/RunShieldResponse'
# GET: required query parameter shield_type; 200 returns a ShieldSpec or null.
/shields/get:
  get:
    tags: [Shields]
    parameters:
    - name: shield_type
      in: query
      required: true
      schema: {type: string}
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              oneOf:
              - $ref: '#/components/schemas/ShieldSpec'
              - type: 'null'
# GET with no query parameters; 200 is declared as application/jsonl with
# ShieldSpec as the schema.
/shields/list:
  get:
    tags: [Shields]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    responses:
      '200':
        description: OK
        content:
          application/jsonl:
            schema:
              $ref: '#/components/schemas/ShieldSpec'
# POST: required JSON body SyntheticDataGenerateRequest; 200 returns
# SyntheticDataGenerationResponse.
/synthetic_data_generation/generate:
  post:
    tags: [SyntheticDataGeneration]
    parameters:
    - name: X-LlamaStack-ProviderData
      in: header
      required: false
      description: JSON-encoded provider data which will be made available to the adapter servicing the API
      schema: {type: string}
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/SyntheticDataGenerateRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/SyntheticDataGenerationResponse'
# GET /telemetry/get_trace
#   query   : trace_id (string, required)
#   response: 200 "OK" with a Trace JSON document
# Nesting is written out explicitly so the two parameter items stay separate
# mappings instead of colliding on `in` / `name` / `required` / `schema`.
/telemetry/get_trace:
  get:
    parameters:
    # Identifies which trace to return; mandatory.
    - in: query
      name: trace_id
      required: true
      schema:
        type: string
    # Optional header. Per its own description it carries JSON-encoded data
    # that is made available to the adapter servicing the call.
    - description: JSON-encoded provider data which will be made available to the
        adapter servicing the API
      in: header
      name: X-LlamaStack-ProviderData
      required: false
      schema:
        type: string
    responses:
      '200':
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/Trace'
        description: OK
    tags:
    - Telemetry
# POST /telemetry/log_event
#   request : JSON body (required) described by LogEventRequest
#   response: 200 "OK" with no response content declared
# Nesting is written out explicitly so each key belongs to exactly one mapping.
/telemetry/log_event:
  post:
    parameters:
    # Optional header. Per its own description it carries JSON-encoded data
    # that is made available to the adapter servicing the call.
    - description: JSON-encoded provider data which will be made available to the
        adapter servicing the API
      in: header
      name: X-LlamaStack-ProviderData
      required: false
      schema:
        type: string
    requestBody:
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/LogEventRequest'
      required: true
    responses:
      # Only a description is given: the spec declares no body for success.
      '200':
        description: OK
    tags:
    - Telemetry
# Security requirement list: a single entry naming the `Default` scheme with an
# empty scope list. The scheme itself is declared outside this section
# (presumably under components.securitySchemes -- confirm).
security:
- Default: []
# Base URL advertised to clients; the host name reads as a placeholder.
# NOTE(review): the URL uses plain http while the spec declares a security
# requirement and an X-LlamaStack-ProviderData header on its operations --
# confirm that real deployments are served over https.
servers:
- url: http://any-hosted-llama-stack.com
# Tag declarations. The first fourteen entries carry a name only; they are the
# API-group tags that operations cite in their own `tags` lists (for example
# Safety, Shields, SyntheticDataGeneration and Telemetry).
tags:
- name: Inference
- name: Shields
- name: Models
- name: MemoryBanks
- name: SyntheticDataGeneration
- name: RewardScoring
- name: PostTraining
- name: Safety
- name: Evaluations
- name: Memory
- name: Telemetry
- name: Agents
- name: BatchInference
- name: Datasets
# Schema tags, BuiltinTool through CompletionResponse. Every item pairs a
# `name` with a `description` that embeds a <SchemaDefinition> element whose
# schemaRef points at the same-named entry under #/components/schemas
# (presumably expanded by the documentation renderer -- confirm).
# `name` is nested inside its item and wrapped scalars are indented, so each
# description/name pair stays one mapping.
# NOTE(review): the double-quoted ToolPromptFormat text separates its prose
# from the element with an explicit \n\n, whereas the single-quoted entries
# below break the line without a blank line, which YAML folds to one space --
# confirm whether blank lines were lost from those entries.
- description: <SchemaDefinition schemaRef="#/components/schemas/BuiltinTool" />
  name: BuiltinTool
- description: <SchemaDefinition schemaRef="#/components/schemas/CompletionMessage"
    />
  name: CompletionMessage
- description: <SchemaDefinition schemaRef="#/components/schemas/SamplingParams" />
  name: SamplingParams
- description: <SchemaDefinition schemaRef="#/components/schemas/SamplingStrategy"
    />
  name: SamplingStrategy
- description: <SchemaDefinition schemaRef="#/components/schemas/StopReason" />
  name: StopReason
- description: <SchemaDefinition schemaRef="#/components/schemas/SystemMessage" />
  name: SystemMessage
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCall" />
  name: ToolCall
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolChoice" />
  name: ToolChoice
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolDefinition" />
  name: ToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolParamDefinition"
    />
  name: ToolParamDefinition
- description: "This Enum refers to the prompt format for calling custom / zero shot\
    \ tools\n\n`json` --\n Refers to the json format for calling tools.\n The\
    \ json format takes the form like\n {\n \"type\": \"function\",\n \
    \ \"function\" : {\n \"name\": \"function_name\",\n \
    \ \"description\": \"function_description\",\n \"parameters\": {...}\n\
    \ }\n }\n\n`function_tag` --\n This is an example of how you could\
    \ define\n your own user defined format for making tool calls.\n The function_tag\
    \ format looks like this,\n <function=function_name>(parameters)</function>\n\
    \nThe detailed prompts for each of these formats are added to llama cli\n\n<SchemaDefinition\
    \ schemaRef=\"#/components/schemas/ToolPromptFormat\" />"
  name: ToolPromptFormat
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolResponseMessage"
    />
  name: ToolResponseMessage
- description: <SchemaDefinition schemaRef="#/components/schemas/UserMessage" />
  name: UserMessage
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchChatCompletionRequest"
    />
  name: BatchChatCompletionRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchChatCompletionResponse"
    />
  name: BatchChatCompletionResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchCompletionRequest"
    />
  name: BatchCompletionRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/BatchCompletionResponse"
    />
  name: BatchCompletionResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/CancelEvaluationJobRequest"
    />
  name: CancelEvaluationJobRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/CancelTrainingJobRequest"
    />
  name: CancelTrainingJobRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest"
    />
  name: ChatCompletionRequest
- description: 'Chat completion response.
    <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />'
  name: ChatCompletionResponse
- description: 'Chat completion response event.
    <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseEvent"
    />'
  name: ChatCompletionResponseEvent
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseEventType"
    />
  name: ChatCompletionResponseEventType
- description: 'SSE-stream of these events.
    <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseStreamChunk"
    />'
  name: ChatCompletionResponseStreamChunk
- description: <SchemaDefinition schemaRef="#/components/schemas/TokenLogProbs" />
  name: TokenLogProbs
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCallDelta" />
  name: ToolCallDelta
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolCallParseStatus"
    />
  name: ToolCallParseStatus
- description: <SchemaDefinition schemaRef="#/components/schemas/CompletionRequest"
    />
  name: CompletionRequest
- description: 'Completion response.
    <SchemaDefinition schemaRef="#/components/schemas/CompletionResponse" />'
  name: CompletionResponse
# Schema tag for CompletionResponseStreamChunk: one sentence of prose followed
# by the <SchemaDefinition> element for the same-named schema. The sentence
# starts with a capital letter and `name` is nested inside the item so the
# description/name pair stays one mapping.
- description: 'Streamed completion response.
    <SchemaDefinition schemaRef="#/components/schemas/CompletionResponseStreamChunk"
    />'
  name: CompletionResponseStreamChunk
# Schema tags, AgentConfig through MemoryBankDocument. Every item pairs a
# `name` with a `description` that embeds a <SchemaDefinition> element whose
# schemaRef points at the same-named entry under #/components/schemas
# (presumably expanded by the documentation renderer -- confirm). Items that
# also carry prose put it ahead of the element inside one quoted scalar.
# `name` is nested inside its item and wrapped scalars are indented, so each
# description/name pair stays one mapping.
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentConfig" />
  name: AgentConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/CodeInterpreterToolDefinition"
    />
  name: CodeInterpreterToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/FunctionCallToolDefinition"
    />
  name: FunctionCallToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryToolDefinition"
    />
  name: MemoryToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/PhotogenToolDefinition"
    />
  name: PhotogenToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/RestAPIExecutionConfig"
    />
  name: RestAPIExecutionConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/RestAPIMethod" />
  name: RestAPIMethod
- description: <SchemaDefinition schemaRef="#/components/schemas/SearchToolDefinition"
    />
  name: SearchToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/URL" />
  name: URL
- description: <SchemaDefinition schemaRef="#/components/schemas/WolframAlphaToolDefinition"
    />
  name: WolframAlphaToolDefinition
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentRequest"
    />
  name: CreateAgentRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentCreateResponse"
    />
  name: AgentCreateResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentSessionRequest"
    />
  name: CreateAgentSessionRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentSessionCreateResponse"
    />
  name: AgentSessionCreateResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/Attachment" />
  name: Attachment
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateAgentTurnRequest"
    />
  name: CreateAgentTurnRequest
- description: 'Streamed agent execution response.
    <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseEvent" />'
  name: AgentTurnResponseEvent
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepCompletePayload"
    />
  name: AgentTurnResponseStepCompletePayload
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepProgressPayload"
    />
  name: AgentTurnResponseStepProgressPayload
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStepStartPayload"
    />
  name: AgentTurnResponseStepStartPayload
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseStreamChunk"
    />
  name: AgentTurnResponseStreamChunk
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseTurnCompletePayload"
    />
  name: AgentTurnResponseTurnCompletePayload
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentTurnResponseTurnStartPayload"
    />
  name: AgentTurnResponseTurnStartPayload
- description: <SchemaDefinition schemaRef="#/components/schemas/InferenceStep" />
  name: InferenceStep
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryRetrievalStep"
    />
  name: MemoryRetrievalStep
- description: <SchemaDefinition schemaRef="#/components/schemas/SafetyViolation"
    />
  name: SafetyViolation
- description: <SchemaDefinition schemaRef="#/components/schemas/ShieldCallStep" />
  name: ShieldCallStep
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolExecutionStep"
    />
  name: ToolExecutionStep
- description: <SchemaDefinition schemaRef="#/components/schemas/ToolResponse" />
  name: ToolResponse
- description: 'A single turn in an interaction with an Agentic System.
    <SchemaDefinition schemaRef="#/components/schemas/Turn" />'
  name: Turn
- description: <SchemaDefinition schemaRef="#/components/schemas/ViolationLevel" />
  name: ViolationLevel
- description: 'Dataset to be used for training or evaluating language models.
    <SchemaDefinition schemaRef="#/components/schemas/TrainEvalDataset" />'
  name: TrainEvalDataset
- description: <SchemaDefinition schemaRef="#/components/schemas/TrainEvalDatasetColumnType"
    />
  name: TrainEvalDatasetColumnType
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateDatasetRequest"
    />
  name: CreateDatasetRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/CreateMemoryBankRequest"
    />
  name: CreateMemoryBankRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryBank" />
  name: MemoryBank
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsRequest"
    />
  name: DeleteAgentsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteAgentsSessionRequest"
    />
  name: DeleteAgentsSessionRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteDatasetRequest"
    />
  name: DeleteDatasetRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/DeleteDocumentsRequest"
    />
  name: DeleteDocumentsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/DropMemoryBankRequest"
    />
  name: DropMemoryBankRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/EmbeddingsRequest"
    />
  name: EmbeddingsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/EmbeddingsResponse"
    />
  name: EmbeddingsResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateQuestionAnsweringRequest"
    />
  name: EvaluateQuestionAnsweringRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluationJob" />
  name: EvaluationJob
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateSummarizationRequest"
    />
  name: EvaluateSummarizationRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluateTextGenerationRequest"
    />
  name: EvaluateTextGenerationRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/GetAgentsSessionRequest"
    />
  name: GetAgentsSessionRequest
- description: 'A single session of an interaction with an Agentic System.
    <SchemaDefinition schemaRef="#/components/schemas/Session" />'
  name: Session
- description: <SchemaDefinition schemaRef="#/components/schemas/AgentStepResponse"
    />
  name: AgentStepResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/GetDocumentsRequest"
    />
  name: GetDocumentsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryBankDocument"
    />
  name: MemoryBankDocument
# Schema tag for EvaluationJobArtifactsResponse: one sentence of prose followed
# by the <SchemaDefinition> element for the same-named schema. The article is
# corrected to "an evaluation job" and `name` is nested inside the item so the
# description/name pair stays one mapping.
- description: 'Artifacts of an evaluation job.
    <SchemaDefinition schemaRef="#/components/schemas/EvaluationJobArtifactsResponse"
    />'
  name: EvaluationJobArtifactsResponse
# Schema tags, EvaluationJobLogStream through UpdateDocumentsRequest. Every
# item pairs a `name` with a `description` that embeds a <SchemaDefinition>
# element whose schemaRef points at the same-named entry under
# #/components/schemas (presumably expanded by the documentation renderer --
# confirm). Items that also carry prose put it ahead of the element inside one
# quoted scalar.
# `name` is nested inside its item and wrapped scalars are indented, so each
# description/name pair stays one mapping.
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluationJobLogStream"
    />
  name: EvaluationJobLogStream
- description: <SchemaDefinition schemaRef="#/components/schemas/EvaluationJobStatusResponse"
    />
  name: EvaluationJobStatusResponse
- description: 'The model family and SKU of the model along with other parameters
    corresponding to the model.
    <SchemaDefinition schemaRef="#/components/schemas/Model" />'
  name: Model
- description: <SchemaDefinition schemaRef="#/components/schemas/ModelServingSpec"
    />
  name: ModelServingSpec
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryBankType" />
  name: MemoryBankType
- description: <SchemaDefinition schemaRef="#/components/schemas/MemoryBankSpec" />
  name: MemoryBankSpec
- description: <SchemaDefinition schemaRef="#/components/schemas/ShieldSpec" />
  name: ShieldSpec
- description: <SchemaDefinition schemaRef="#/components/schemas/Trace" />
  name: Trace
- description: 'Checkpoint created during training runs
    <SchemaDefinition schemaRef="#/components/schemas/Checkpoint" />'
  name: Checkpoint
- description: 'Artifacts of a finetuning job.
    <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobArtifactsResponse"
    />'
  name: PostTrainingJobArtifactsResponse
- description: 'Stream of logs from a finetuning job.
    <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobLogStream" />'
  name: PostTrainingJobLogStream
- description: <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobStatus"
    />
  name: PostTrainingJobStatus
- description: 'Status of a finetuning job.
    <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJobStatusResponse"
    />'
  name: PostTrainingJobStatusResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/PostTrainingJob"
    />
  name: PostTrainingJob
- description: <SchemaDefinition schemaRef="#/components/schemas/InsertDocumentsRequest"
    />
  name: InsertDocumentsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/LogSeverity" />
  name: LogSeverity
- description: <SchemaDefinition schemaRef="#/components/schemas/MetricEvent" />
  name: MetricEvent
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanEndPayload" />
  name: SpanEndPayload
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanStartPayload"
    />
  name: SpanStartPayload
- description: <SchemaDefinition schemaRef="#/components/schemas/SpanStatus" />
  name: SpanStatus
- description: <SchemaDefinition schemaRef="#/components/schemas/StructuredLogEvent"
    />
  name: StructuredLogEvent
- description: <SchemaDefinition schemaRef="#/components/schemas/UnstructuredLogEvent"
    />
  name: UnstructuredLogEvent
- description: <SchemaDefinition schemaRef="#/components/schemas/LogEventRequest"
    />
  name: LogEventRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/DPOAlignmentConfig"
    />
  name: DPOAlignmentConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/OptimizerConfig"
    />
  name: OptimizerConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/RLHFAlgorithm" />
  name: RLHFAlgorithm
- description: <SchemaDefinition schemaRef="#/components/schemas/TrainingConfig" />
  name: TrainingConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/PreferenceOptimizeRequest"
    />
  name: PreferenceOptimizeRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryDocumentsRequest"
    />
  name: QueryDocumentsRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/QueryDocumentsResponse"
    />
  name: QueryDocumentsResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/DialogGenerations"
    />
  name: DialogGenerations
- description: <SchemaDefinition schemaRef="#/components/schemas/RewardScoreRequest"
    />
  name: RewardScoreRequest
- description: 'Response from the reward scoring. Batch of (prompt, response, score)
    tuples that pass the threshold.
    <SchemaDefinition schemaRef="#/components/schemas/RewardScoringResponse" />'
  name: RewardScoringResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoredDialogGenerations"
    />
  name: ScoredDialogGenerations
- description: <SchemaDefinition schemaRef="#/components/schemas/ScoredMessage" />
  name: ScoredMessage
- description: <SchemaDefinition schemaRef="#/components/schemas/RunShieldRequest"
    />
  name: RunShieldRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/RunShieldResponse"
    />
  name: RunShieldResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/DoraFinetuningConfig"
    />
  name: DoraFinetuningConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/FinetuningAlgorithm"
    />
  name: FinetuningAlgorithm
- description: <SchemaDefinition schemaRef="#/components/schemas/LoraFinetuningConfig"
    />
  name: LoraFinetuningConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/QLoraFinetuningConfig"
    />
  name: QLoraFinetuningConfig
- description: <SchemaDefinition schemaRef="#/components/schemas/SupervisedFineTuneRequest"
    />
  name: SupervisedFineTuneRequest
- description: <SchemaDefinition schemaRef="#/components/schemas/SyntheticDataGenerateRequest"
    />
  name: SyntheticDataGenerateRequest
- description: 'Response from the synthetic data generation. Batch of (prompt, response,
    score) tuples that pass the threshold.
    <SchemaDefinition schemaRef="#/components/schemas/SyntheticDataGenerationResponse"
    />'
  name: SyntheticDataGenerationResponse
- description: <SchemaDefinition schemaRef="#/components/schemas/UpdateDocumentsRequest"
    />
  name: UpdateDocumentsRequest
# Vendor extension (x- prefix) that sorts tag names into named groups
# (presumably read by the documentation renderer to build its navigation --
# confirm). This first group, "Operations", lists the fourteen API-group tags
# in alphabetical order.
# The group's `tags` list is nested under the group item so it cannot be read
# as a second root-level `tags` key.
x-tagGroups:
- name: Operations
  tags:
  - Agents
  - BatchInference
  - Datasets
  - Evaluations
  - Inference
  - Memory
  - MemoryBanks
  - Models
  - PostTraining
  - RewardScoring
  - Safety
  - Shields
  - SyntheticDataGeneration
  - Telemetry
# Tag group "Types": the schema tag names, listed alphabetically. Each string
# is expected to match the `name` of a tag declared in the root `tags` list.
# The group's `tags` list is nested under the group item so it cannot be read
# as a root-level `tags` key.
- name: Types
  tags:
  - AgentConfig
  - AgentCreateResponse
  - AgentSessionCreateResponse
  - AgentStepResponse
  - AgentTurnResponseEvent
  - AgentTurnResponseStepCompletePayload
  - AgentTurnResponseStepProgressPayload
  - AgentTurnResponseStepStartPayload
  - AgentTurnResponseStreamChunk
  - AgentTurnResponseTurnCompletePayload
  - AgentTurnResponseTurnStartPayload
  - Attachment
  - BatchChatCompletionRequest
  - BatchChatCompletionResponse
  - BatchCompletionRequest
  - BatchCompletionResponse
  - BuiltinTool
  - CancelEvaluationJobRequest
  - CancelTrainingJobRequest
  - ChatCompletionRequest
  - ChatCompletionResponse
  - ChatCompletionResponseEvent
  - ChatCompletionResponseEventType
  - ChatCompletionResponseStreamChunk
  - Checkpoint
  - CodeInterpreterToolDefinition
  - CompletionMessage
  - CompletionRequest
  - CompletionResponse
  - CompletionResponseStreamChunk
  - CreateAgentRequest
  - CreateAgentSessionRequest
  - CreateAgentTurnRequest
  - CreateDatasetRequest
  - CreateMemoryBankRequest
  - DPOAlignmentConfig
  - DeleteAgentsRequest
  - DeleteAgentsSessionRequest
  - DeleteDatasetRequest
  - DeleteDocumentsRequest
  - DialogGenerations
  - DoraFinetuningConfig
  - DropMemoryBankRequest
  - EmbeddingsRequest
  - EmbeddingsResponse
  - EvaluateQuestionAnsweringRequest
  - EvaluateSummarizationRequest
  - EvaluateTextGenerationRequest
  - EvaluationJob
  - EvaluationJobArtifactsResponse
  - EvaluationJobLogStream
  - EvaluationJobStatusResponse
  - FinetuningAlgorithm
  - FunctionCallToolDefinition
  - GetAgentsSessionRequest
  - GetDocumentsRequest
  - InferenceStep
  - InsertDocumentsRequest
  - LogEventRequest
  - LogSeverity
  - LoraFinetuningConfig
  - MemoryBank
  - MemoryBankDocument
  - MemoryBankSpec
  - MemoryBankType
  - MemoryRetrievalStep
  - MemoryToolDefinition
  - MetricEvent
  - Model
  - ModelServingSpec
  - OptimizerConfig
  - PhotogenToolDefinition
  - PostTrainingJob
  - PostTrainingJobArtifactsResponse
  - PostTrainingJobLogStream
  - PostTrainingJobStatus
  - PostTrainingJobStatusResponse
  - PreferenceOptimizeRequest
  - QLoraFinetuningConfig
  - QueryDocumentsRequest
  - QueryDocumentsResponse
  - RLHFAlgorithm
  - RestAPIExecutionConfig
  - RestAPIMethod
  - RewardScoreRequest
  - RewardScoringResponse
  - RunShieldRequest
  - RunShieldResponse
  - SafetyViolation
  - SamplingParams
  - SamplingStrategy
  - ScoredDialogGenerations
  - ScoredMessage
  - SearchToolDefinition
  - Session
  - ShieldCallStep
  - ShieldSpec
  - SpanEndPayload
  - SpanStartPayload
  - SpanStatus
  - StopReason
  - StructuredLogEvent
  - SupervisedFineTuneRequest
  - SyntheticDataGenerateRequest
  - SyntheticDataGenerationResponse
  - SystemMessage
  - TokenLogProbs
  - ToolCall
  - ToolCallDelta
  - ToolCallParseStatus
  - ToolChoice
  - ToolDefinition
  - ToolExecutionStep
  - ToolParamDefinition
  - ToolPromptFormat
  - ToolResponse
  - ToolResponseMessage
  - Trace
  - TrainEvalDataset
  - TrainEvalDatasetColumnType
  - TrainingConfig
  - Turn
  - URL
  - UnstructuredLogEvent
  - UpdateDocumentsRequest
  - UserMessage
  - ViolationLevel
  - WolframAlphaToolDefinition