# Mirror of https://github.com/meta-llama/llama-stack.git
# Synced 2025-07-14 17:16:09 +00:00 - 811 lines, 22 KiB, YAML
components:
|
|
responses: {}
|
|
schemas:
|
|
# Request body of POST /agentic_system/create.
AgenticSystemCreateRequest:
  type: object
  properties:
    # Each entry is either a builtin tool name or a custom tool definition
    # (tool_name plus a free-form parameters map).
    available_tools:
      type: array
      items:
        oneOf:
          - type: string
            title: >-
              Builtin tools are tools the model is natively aware of and was
              potentially fine-tuned with.
            enum: [web_search, math, image_gen, code_interpreter]
          - type: object
            properties:
              parameters:
                type: object
                # Parameter values may be of any JSON type.
                additionalProperties:
                  oneOf:
                    - type: 'null'
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
              tool_name:
                type: string
            required: [tool_name, parameters]
            additionalProperties: false
    executable_tools:
      type: array
      items:
        type: string
      uniqueItems: true
    instructions:
      type: string
    model:
      type: string
      enum: [llama3_8b_chat, llama3_70b_chat]
  required: [instructions, model, available_tools, executable_tools]
  additionalProperties: false
|
|
# Response body of POST /agentic_system/create.
AgenticSystemCreateResponse:
  type: object
  properties:
    agent_id:
      type: string
  required: [agent_id]
  additionalProperties: false
|
|
# Request body of POST /agentic_system/execute.
AgenticSystemExecuteRequest:
  type: object
  properties:
    agent_id:
      type: string
    messages:
      type: array
      items:
        $ref: '#/components/schemas/Message'
    stream:
      type: boolean
      default: false
    turn_history:
      type: array
      items:
        $ref: '#/components/schemas/AgenticSystemTurn'
  # NOTE(review): `stream` declares a default yet is also required; confirm
  # whether clients are really expected to always send it.
  required: [agent_id, messages, turn_history, stream]
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /agentic_system/execute.
AgenticSystemExecuteResponse:
  type: object
  title: non-stream response from the agentic system.
  properties:
    turn:
      $ref: '#/components/schemas/AgenticSystemTurn'
  required: [turn]
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /agentic_system/execute.
AgenticSystemExecuteResponseStreamChunk:
  type: object
  title: Streamed agent execution response.
  properties:
    # Optional: only `turn` is listed as required below.
    stop_reason:
      type: string
      title: >-
        Stop reasons are used to indicate why the model stopped generating
        text.
      enum: [not_stopped, finished_ok, max_tokens]
    turn:
      $ref: '#/components/schemas/AgenticSystemTurn'
  required: [turn]
  additionalProperties: false
|
|
# A turn bundles the user messages, the execution steps and the response
# message; all three are required.
AgenticSystemTurn:
  type: object
  title: A single turn in an interaction with an Agentic System.
  properties:
    response_message:
      $ref: '#/components/schemas/Message'
    # Every step must match exactly one of the four shapes below.
    # NOTE(review): each shape accepts all four step_type values and differs
    # only in its default; confirm whether each shape should pin step_type
    # to its own value.
    steps:
      type: array
      items:
        oneOf:
          # Shape 1: step_type defaults to model_inference.
          - type: object
            properties:
              logprobs:
                type: object
                # Values may be of any JSON type.
                additionalProperties:
                  oneOf:
                    - type: 'null'
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
              step_type:
                type: string
                title: The type of execution step.
                default: model_inference
                enum:
                  - model_inference
                  - tool_execution
                  - safety_filtering
                  - memory_retrieval
              text:
                type: string
            required: [step_type, text]
            additionalProperties: false
          # Shape 2: step_type defaults to tool_execution.
          - type: object
            properties:
              step_type:
                type: string
                title: The type of execution step.
                default: tool_execution
                enum:
                  - model_inference
                  - tool_execution
                  - safety_filtering
                  - memory_retrieval
              tool_calls:
                type: array
                items:
                  type: object
                  title: A tool call is a request to a tool.
                  properties:
                    arguments:
                      type: object
                      # Argument values may be of any JSON type.
                      additionalProperties:
                        oneOf:
                          - type: 'null'
                          - type: boolean
                          - type: number
                          - type: string
                          - type: array
                          - type: object
                    tool_name:
                      type: string
                  required: [tool_name, arguments]
                  additionalProperties: false
              tool_responses:
                type: array
                items:
                  type: object
                  properties:
                    response:
                      type: string
                    tool_name:
                      type: string
                  required: [tool_name, response]
                  additionalProperties: false
            required: [step_type, tool_calls, tool_responses]
            additionalProperties: false
          # Shape 3: step_type defaults to safety_filtering; `violation` is
          # optional.
          - type: object
            properties:
              step_type:
                type: string
                title: The type of execution step.
                default: safety_filtering
                enum:
                  - model_inference
                  - tool_execution
                  - safety_filtering
                  - memory_retrieval
              violation:
                type: object
                properties:
                  details:
                    type: string
                  suggested_user_response:
                    type: string
                  violation_type:
                    type: string
                required: [violation_type, details]
                additionalProperties: false
            required: [step_type]
            additionalProperties: false
          # Shape 4: step_type defaults to memory_retrieval.
          - type: object
            properties:
              documents:
                type: array
                items:
                  type: string
              scores:
                type: array
                items:
                  type: number
              step_type:
                type: string
                title: The type of execution step.
                default: memory_retrieval
                enum:
                  - model_inference
                  - tool_execution
                  - safety_filtering
                  - memory_retrieval
            required: [step_type, documents, scores]
            additionalProperties: false
    user_messages:
      type: array
      items:
        $ref: '#/components/schemas/Message'
  required: [user_messages, steps, response_message]
  additionalProperties: false
|
|
# A URL plus its MIME type; both fields are required.
Attachment:
  type: object
  title: >-
    Attachments are used to refer to external resources, such as images,
    videos, audio, etc.
  properties:
    mime_type:
      type: string
    url:
      $ref: '#/components/schemas/URL'
  required: [url, mime_type]
  additionalProperties: false
|
|
# Request body of POST /chat_completion.
ChatCompletionRequest:
  type: object
  properties:
    # Each entry is either a builtin tool name or a custom tool definition
    # (tool_name plus a free-form parameters map).
    available_tools:
      type: array
      items:
        oneOf:
          - type: string
            title: >-
              Builtin tools are tools the model is natively aware of and was
              potentially fine-tuned with.
            enum: [web_search, math, image_gen, code_interpreter]
          - type: object
            properties:
              parameters:
                type: object
                # Parameter values may be of any JSON type.
                additionalProperties:
                  oneOf:
                    - type: 'null'
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
              tool_name:
                type: string
            required: [tool_name, parameters]
            additionalProperties: false
    logprobs:
      type: boolean
      default: false
    max_tokens:
      type: integer
      default: 0
    message:
      $ref: '#/components/schemas/Message'
    message_history:
      type: array
      items:
        $ref: '#/components/schemas/Message'
    model:
      type: string
      enum: [llama3_8b_chat, llama3_70b_chat]
    sampling_params:
      type: object
      properties:
        strategy:
          type: string
          default: greedy
        temperature:
          type: number
          default: 0.0
        top_k:
          type: integer
          default: 0
        top_p:
          type: number
          default: 0.95
      required: [temperature, strategy, top_p, top_k]
      additionalProperties: false
    stream:
      type: boolean
      default: false
  required:
    - message
    - model
    - message_history
    - sampling_params
    - available_tools
    - max_tokens
    - stream
    - logprobs
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /chat_completion.
ChatCompletionResponse:
  type: object
  title: Normal chat completion response.
  properties:
    # A string, a single Attachment, or an array mixing both.
    content:
      oneOf:
        - type: string
        - $ref: '#/components/schemas/Attachment'
        - type: array
          items:
            oneOf:
              - type: string
              - $ref: '#/components/schemas/Attachment'
    logprobs:
      type: object
      # Values may be of any JSON type.
      additionalProperties:
        oneOf:
          - type: 'null'
          - type: boolean
          - type: number
          - type: string
          - type: array
          - type: object
    stop_reason:
      type: string
      title: >-
        Stop reasons are used to indicate why the model stopped generating
        text.
      enum: [not_stopped, finished_ok, max_tokens]
    tool_calls:
      type: array
      items:
        type: object
        title: A tool call is a request to a tool.
        properties:
          arguments:
            type: object
            # Argument values may be of any JSON type.
            additionalProperties:
              oneOf:
                - type: 'null'
                - type: boolean
                - type: number
                - type: string
                - type: array
                - type: object
          tool_name:
            type: string
        required: [tool_name, arguments]
        additionalProperties: false
  required: [content, tool_calls]
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /chat_completion; only
# text_delta is required.
ChatCompletionResponseStreamChunk:
  type: object
  title: >-
    Streamed chat completion response. The actual response is a series of
    such objects.
  properties:
    stop_reason:
      type: string
      title: >-
        Stop reasons are used to indicate why the model stopped generating
        text.
      enum: [not_stopped, finished_ok, max_tokens]
    text_delta:
      type: string
    tool_call:
      type: object
      title: A tool call is a request to a tool.
      properties:
        arguments:
          type: object
          # Argument values may be of any JSON type.
          additionalProperties:
            oneOf:
              - type: 'null'
              - type: boolean
              - type: number
              - type: string
              - type: array
              - type: object
        tool_name:
          type: string
      required: [tool_name, arguments]
      additionalProperties: false
  required: [text_delta]
  additionalProperties: false
|
|
# Request body of POST /completion.
CompletionRequest:
  type: object
  properties:
    # A string, a single Attachment, or an array mixing both.
    content:
      oneOf:
        - type: string
        - $ref: '#/components/schemas/Attachment'
        - type: array
          items:
            oneOf:
              - type: string
              - $ref: '#/components/schemas/Attachment'
    logprobs:
      type: boolean
      default: false
    max_tokens:
      type: integer
      default: 0
    model:
      type: string
      enum: [llama3_8b, llama3_70b]
    sampling_params:
      type: object
      properties:
        strategy:
          type: string
          default: greedy
        temperature:
          type: number
          default: 0.0
        top_k:
          type: integer
          default: 0
        top_p:
          type: number
          default: 0.95
      required: [temperature, strategy, top_p, top_k]
      additionalProperties: false
    stream:
      type: boolean
      default: false
  required:
    - content
    - model
    - sampling_params
    - max_tokens
    - stream
    - logprobs
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /completion.
CompletionResponse:
  type: object
  title: Normal completion response.
  properties:
    # A string, a single Attachment, or an array mixing both.
    content:
      oneOf:
        - type: string
        - $ref: '#/components/schemas/Attachment'
        - type: array
          items:
            oneOf:
              - type: string
              - $ref: '#/components/schemas/Attachment'
    logprobs:
      type: object
      # Values may be of any JSON type.
      additionalProperties:
        oneOf:
          - type: 'null'
          - type: boolean
          - type: number
          - type: string
          - type: array
          - type: object
    stop_reason:
      type: string
      title: >-
        Stop reasons are used to indicate why the model stopped generating
        text.
      enum: [not_stopped, finished_ok, max_tokens]
  required: [content]
  additionalProperties: false
|
|
# One of the two 200-response shapes of POST /completion; only text_delta
# is required.
CompletionResponseStreamChunk:
  type: object
  title: streamed completion response.
  properties:
    logprobs:
      type: object
      # Values may be of any JSON type.
      additionalProperties:
        oneOf:
          - type: 'null'
          - type: boolean
          - type: number
          - type: string
          - type: array
          - type: object
    stop_reason:
      type: string
      title: >-
        Stop reasons are used to indicate why the model stopped generating
        text.
      enum: [not_stopped, finished_ok, max_tokens]
    text_delta:
      type: string
  required: [text_delta]
  additionalProperties: false
|
|
# A message with a role, content, tool calls and tool responses; all four
# fields are required.
Message:
  type: object
  properties:
    # A string, a single Attachment, or an array mixing both.
    content:
      oneOf:
        - type: string
        - $ref: '#/components/schemas/Attachment'
        - type: array
          items:
            oneOf:
              - type: string
              - $ref: '#/components/schemas/Attachment'
    role:
      type: string
      enum: [system, user, assistant, tool]
    tool_calls:
      type: array
      items:
        type: object
        title: A tool call is a request to a tool.
        properties:
          arguments:
            type: object
            # Argument values may be of any JSON type.
            additionalProperties:
              oneOf:
                - type: 'null'
                - type: boolean
                - type: number
                - type: string
                - type: array
                - type: object
          tool_name:
            type: string
        required: [tool_name, arguments]
        additionalProperties: false
    tool_responses:
      type: array
      items:
        type: object
        properties:
          response:
            type: string
          tool_name:
            type: string
        required: [tool_name, response]
        additionalProperties: false
  required: [role, content, tool_calls, tool_responses]
  additionalProperties: false
|
|
# URI string that must start with http://, https://, file:// or data:.
URL:
  type: string
  format: uri
  # Quoted so the regex metacharacters are never read as YAML syntax.
  pattern: '^(https?://|file://|data:)'
|
|
# API metadata. The version stays quoted so it is a string, not a float.
info:
  title: Llama Stack specification
  version: '0.1'
  description: This is the llama stack
|
|
# OpenAPI document version and the default JSON Schema dialect for schemas.
openapi: '3.1.0'
jsonSchemaDialect: 'https://json-schema.org/draft/2020-12/schema'
|
|
paths:
|
|
# Takes an AgenticSystemCreateRequest and returns an
# AgenticSystemCreateResponse.
/agentic_system/create:
  post:
    tags: [AgenticSystem]
    parameters: []
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/AgenticSystemCreateRequest'
    responses:
      '200':
        description: OK
        content:
          application/json:
            schema:
              $ref: '#/components/schemas/AgenticSystemCreateResponse'
|
|
# Takes an AgenticSystemExecuteRequest; the 200 body is either the
# non-stream response or a stream chunk.
/agentic_system/execute:
  post:
    tags: [AgenticSystem]
    parameters: []
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/AgenticSystemExecuteRequest'
    responses:
      '200':
        description: >-
          non-stream response from the agentic system. **OR** Streamed
          agent execution response.
        content:
          # NOTE(review): the stream-chunk shape is also declared under
          # application/json; confirm the media type used when streaming.
          application/json:
            schema:
              oneOf:
                - $ref: '#/components/schemas/AgenticSystemExecuteResponse'
                - $ref: '#/components/schemas/AgenticSystemExecuteResponseStreamChunk'
|
|
# Takes a ChatCompletionRequest; the 200 body is either the normal response
# or a stream chunk.
/chat_completion:
  post:
    tags: [Inference]
    parameters: []
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/ChatCompletionRequest'
    responses:
      '200':
        description: >-
          Normal chat completion response. **OR** Streamed chat completion
          response. The actual response is a series of such objects.
        content:
          # NOTE(review): the stream-chunk shape is also declared under
          # application/json; confirm the media type used when streaming.
          application/json:
            schema:
              oneOf:
                - $ref: '#/components/schemas/ChatCompletionResponse'
                - $ref: '#/components/schemas/ChatCompletionResponseStreamChunk'
|
|
# Takes a CompletionRequest; the 200 body is either the normal response or
# a stream chunk.
/completion:
  post:
    tags: [Inference]
    parameters: []
    requestBody:
      required: true
      content:
        application/json:
          schema:
            $ref: '#/components/schemas/CompletionRequest'
    responses:
      '200':
        description: >-
          Normal completion response. **OR** streamed completion response.
        content:
          # NOTE(review): the stream-chunk shape is also declared under
          # application/json; confirm the media type used when streaming.
          application/json:
            schema:
              oneOf:
                - $ref: '#/components/schemas/CompletionResponse'
                - $ref: '#/components/schemas/CompletionResponseStreamChunk'
|
|
# Document-level security requirement.
# NOTE(review): no `securitySchemes` entry named `Default` is visible under
# `components` in this file, and OpenAPI requires every requirement name to
# match a declared scheme. Confirm where `Default` is meant to be defined.
security:
  - Default: []
|
|
# The single server entry for this API.
servers:
  - url: 'http://llama.meta.com'
|
|
# Tag catalogue: two operation tags followed by one tag per schema. Each
# schema tag's description embeds a <SchemaDefinition> element; where a
# schema has a title, the title comes first, separated by a blank line.
tags:
  - name: Inference
  - name: AgenticSystem
  - name: AgenticSystemCreateRequest
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemCreateRequest" />
  - name: AgenticSystemCreateResponse
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemCreateResponse" />
  - name: AgenticSystemExecuteRequest
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteRequest" />
  - name: AgenticSystemTurn
    description: |-
      A single turn in an interaction with an Agentic System.

      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemTurn" />
  - name: Attachment
    description: |-
      Attachments are used to refer to external resources, such as images, videos, audio, etc.

      <SchemaDefinition schemaRef="#/components/schemas/Attachment" />
  - name: Message
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/Message" />
  - name: URL
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/URL" />
  - name: AgenticSystemExecuteResponse
    description: |-
      non-stream response from the agentic system.

      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteResponse" />
  - name: AgenticSystemExecuteResponseStreamChunk
    description: |-
      Streamed agent execution response.

      <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteResponseStreamChunk" />
  - name: ChatCompletionRequest
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest" />
  - name: ChatCompletionResponse
    description: |-
      Normal chat completion response.

      <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />
  - name: ChatCompletionResponseStreamChunk
    description: |-
      Streamed chat completion response. The actual response is a series of such objects.

      <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseStreamChunk" />
  - name: CompletionRequest
    description: >-
      <SchemaDefinition schemaRef="#/components/schemas/CompletionRequest" />
  - name: CompletionResponse
    description: |-
      Normal completion response.

      <SchemaDefinition schemaRef="#/components/schemas/CompletionResponse" />
  - name: CompletionResponseStreamChunk
    description: |-
      streamed completion response.

      <SchemaDefinition schemaRef="#/components/schemas/CompletionResponseStreamChunk" />
|
|
# Vendor extension that splits the tags into two groups: the operation tags
# and the per-schema type tags.
x-tagGroups:
  - name: Operations
    tags: [AgenticSystem, Inference]
  - name: Types
    tags:
      - AgenticSystemCreateRequest
      - AgenticSystemCreateResponse
      - AgenticSystemExecuteRequest
      - AgenticSystemExecuteResponse
      - AgenticSystemExecuteResponseStreamChunk
      - AgenticSystemTurn
      - Attachment
      - ChatCompletionRequest
      - ChatCompletionResponse
      - ChatCompletionResponseStreamChunk
      - CompletionRequest
      - CompletionResponse
      - CompletionResponseStreamChunk
      - Message
      - URL
|