mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-03 12:52:41 +00:00
more definitions
This commit is contained in:
parent
722d20c6de
commit
6e4586ba7a
3 changed files with 775 additions and 178 deletions
165
source/defn.py
165
source/defn.py
|
@ -1,6 +1,6 @@
|
||||||
from dataclasses import dataclass, field
|
from dataclasses import dataclass, field
|
||||||
from enum import Enum
|
from enum import Enum
|
||||||
from typing import Any, Dict, List, Optional, Protocol, Union
|
from typing import Any, Dict, List, Optional, Protocol, Set, Union
|
||||||
|
|
||||||
import yaml
|
import yaml
|
||||||
|
|
||||||
|
@ -45,16 +45,6 @@ class Role(Enum):
|
||||||
tool = "tool"
|
tool = "tool"
|
||||||
|
|
||||||
|
|
||||||
class StopReason(Enum):
|
|
||||||
"""
|
|
||||||
Stop reasons are used to indicate why the model stopped generating text.
|
|
||||||
"""
|
|
||||||
|
|
||||||
not_stopped = "not_stopped"
|
|
||||||
finished_ok = "finished_ok"
|
|
||||||
max_tokens = "max_tokens"
|
|
||||||
|
|
||||||
|
|
||||||
@dataclass
|
@dataclass
|
||||||
class ToolCall:
|
class ToolCall:
|
||||||
"""
|
"""
|
||||||
|
@ -77,6 +67,28 @@ class ToolDefinition:
|
||||||
parameters: Dict[str, Any]
|
parameters: Dict[str, Any]
|
||||||
|
|
||||||
|
|
||||||
|
# TODO: we need to document the parameters for the tool calls
|
||||||
|
class BuiltinTool(Enum):
|
||||||
|
"""
|
||||||
|
Builtin tools are tools the model is natively aware of and was potentially fine-tuned with.
|
||||||
|
"""
|
||||||
|
|
||||||
|
web_search = "web_search"
|
||||||
|
math = "math"
|
||||||
|
image_gen = "image_gen"
|
||||||
|
code_interpreter = "code_interpreter"
|
||||||
|
|
||||||
|
|
||||||
|
class StopReason(Enum):
|
||||||
|
"""
|
||||||
|
Stop reasons are used to indicate why the model stopped generating text.
|
||||||
|
"""
|
||||||
|
|
||||||
|
not_stopped = "not_stopped"
|
||||||
|
finished_ok = "finished_ok"
|
||||||
|
max_tokens = "max_tokens"
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
@json_schema_type
|
||||||
@dataclass
|
@dataclass
|
||||||
class Message:
|
class Message:
|
||||||
|
@ -85,9 +97,6 @@ class Message:
|
||||||
# input to the model or output from the model
|
# input to the model or output from the model
|
||||||
content: Content
|
content: Content
|
||||||
|
|
||||||
# zero-shot tool definitions as input to the model
|
|
||||||
tool_definitions: List[ToolDefinition] = field(default_factory=list)
|
|
||||||
|
|
||||||
# output from the model
|
# output from the model
|
||||||
tool_calls: List[ToolCall] = field(default_factory=list)
|
tool_calls: List[ToolCall] = field(default_factory=list)
|
||||||
|
|
||||||
|
@ -95,45 +104,6 @@ class Message:
|
||||||
tool_responses: List[ToolResponse] = field(default_factory=list)
|
tool_responses: List[ToolResponse] = field(default_factory=list)
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
|
||||||
@dataclass
|
|
||||||
class CompletionResponse:
|
|
||||||
"""Normal completion response."""
|
|
||||||
content: Content
|
|
||||||
stop_reason: StopReason
|
|
||||||
logprobs: Optional[Dict[str, Any]] = None
|
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
|
||||||
@dataclass
|
|
||||||
class StreamedCompletionResponse:
|
|
||||||
"""streamed completion response."""
|
|
||||||
text_delta: str
|
|
||||||
stop_reason: StopReason
|
|
||||||
logprobs: Optional[Dict[str, Any]] = None
|
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
|
||||||
@dataclass
|
|
||||||
class ChatCompletionResponse:
|
|
||||||
"""Normal chat completion response."""
|
|
||||||
|
|
||||||
content: Content
|
|
||||||
stop_reason: StopReason
|
|
||||||
tool_calls: List[ToolCall] = field(default_factory=list)
|
|
||||||
logprobs: Optional[Dict[str, Any]] = None
|
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
|
||||||
@dataclass
|
|
||||||
class StreamedChatCompletionResponse:
|
|
||||||
"""Streamed chat completion response."""
|
|
||||||
|
|
||||||
text_delta: str
|
|
||||||
stop_reason: StopReason
|
|
||||||
tool_call: Optional[ToolCall] = None
|
|
||||||
|
|
||||||
|
|
||||||
@dataclass
|
@dataclass
|
||||||
class SamplingParams:
|
class SamplingParams:
|
||||||
temperature: float = 0.0
|
temperature: float = 0.0
|
||||||
|
@ -165,16 +135,69 @@ class CompletionRequest:
|
||||||
|
|
||||||
@json_schema_type
|
@json_schema_type
|
||||||
@dataclass
|
@dataclass
|
||||||
class ChatCompletionRequest:
|
class CompletionResponse:
|
||||||
|
"""Normal completion response."""
|
||||||
|
|
||||||
|
content: Content
|
||||||
|
stop_reason: Optional[StopReason] = None
|
||||||
|
logprobs: Optional[Dict[str, Any]] = None
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class StreamedCompletionResponse:
|
||||||
|
"""streamed completion response."""
|
||||||
|
|
||||||
|
text_delta: str
|
||||||
|
stop_reason: Optional[StopReason] = None
|
||||||
|
logprobs: Optional[Dict[str, Any]] = None
|
||||||
|
|
||||||
|
|
||||||
|
@dataclass
|
||||||
|
class ChatCompletionRequestCommon:
|
||||||
message: Message
|
message: Message
|
||||||
message_history: List[Message] = None
|
message_history: List[Message] = None
|
||||||
model: InstructModel = InstructModel.llama3_8b_chat
|
model: InstructModel = InstructModel.llama3_8b_chat
|
||||||
sampling_params: SamplingParams = SamplingParams()
|
sampling_params: SamplingParams = SamplingParams()
|
||||||
|
|
||||||
|
# zero-shot tool definitions as input to the model
|
||||||
|
available_tools: List[Union[BuiltinTool, ToolDefinition]] = field(
|
||||||
|
default_factory=list
|
||||||
|
)
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class ChatCompletionRequest(ChatCompletionRequestCommon):
|
||||||
max_tokens: int = 0
|
max_tokens: int = 0
|
||||||
stream: bool = False
|
stream: bool = False
|
||||||
logprobs: bool = False
|
logprobs: bool = False
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class ChatCompletionResponse:
|
||||||
|
"""Normal chat completion response."""
|
||||||
|
|
||||||
|
content: Content
|
||||||
|
|
||||||
|
# note: multiple tool calls can be generated in a single response
|
||||||
|
tool_calls: List[ToolCall] = field(default_factory=list)
|
||||||
|
|
||||||
|
stop_reason: Optional[StopReason] = None
|
||||||
|
logprobs: Optional[Dict[str, Any]] = None
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class StreamedChatCompletionResponse:
|
||||||
|
"""Streamed chat completion response."""
|
||||||
|
|
||||||
|
text_delta: str
|
||||||
|
stop_reason: Optional[StopReason] = None
|
||||||
|
tool_call: Optional[ToolCall] = None
|
||||||
|
|
||||||
|
|
||||||
class Inference(Protocol):
|
class Inference(Protocol):
|
||||||
|
|
||||||
def post_completion(
|
def post_completion(
|
||||||
|
@ -188,19 +211,41 @@ class Inference(Protocol):
|
||||||
) -> Union[ChatCompletionResponse, StreamedChatCompletionResponse]: ...
|
) -> Union[ChatCompletionResponse, StreamedChatCompletionResponse]: ...
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class AgenticSystemExecuteRequest(ChatCompletionRequestCommon):
|
||||||
|
executable_tools: Set[str] = field(default_factory=set)
|
||||||
|
stream: bool = False
|
||||||
|
|
||||||
|
|
||||||
@json_schema_type
|
@json_schema_type
|
||||||
@dataclass
|
@dataclass
|
||||||
class AgenticSystemExecuteRequest:
|
class AgenticSystemExecuteResponse:
|
||||||
message: Message
|
"""Normal chat completion response."""
|
||||||
message_history: List[Message] = None
|
|
||||||
model: InstructModel = InstructModel.llama3_8b_chat
|
content: Content
|
||||||
sampling_params: SamplingParams = SamplingParams()
|
stop_reason: StopReason
|
||||||
|
tool_calls: List[ToolCall] = field(default_factory=list)
|
||||||
|
logprobs: Optional[Dict[str, Any]] = None
|
||||||
|
|
||||||
|
|
||||||
|
@json_schema_type
|
||||||
|
@dataclass
|
||||||
|
class StreamedAgenticSystemExecuteResponse:
|
||||||
|
"""Streamed chat completion response."""
|
||||||
|
|
||||||
|
text_delta: str
|
||||||
|
stop_reason: StopReason
|
||||||
|
tool_call: Optional[ToolCall] = None
|
||||||
|
|
||||||
|
|
||||||
class AgenticSystem(Protocol):
|
class AgenticSystem(Protocol):
|
||||||
|
|
||||||
@webmethod(route="/agentic/system/execute")
|
@webmethod(route="/agentic/system/execute")
|
||||||
def create_agentic_system_execute(self,) -> str: ...
|
def create_agentic_system_execute(
|
||||||
|
self,
|
||||||
|
request: AgenticSystemExecuteRequest,
|
||||||
|
) -> Union[AgenticSystemExecuteResponse, StreamedAgenticSystemExecuteResponse]: ...
|
||||||
|
|
||||||
|
|
||||||
class Endpoint(Inference, AgenticSystem): ...
|
class Endpoint(Inference, AgenticSystem): ...
|
||||||
|
|
|
@ -30,14 +30,21 @@
|
||||||
],
|
],
|
||||||
"paths": {
|
"paths": {
|
||||||
"/agentic/system/execute": {
|
"/agentic/system/execute": {
|
||||||
"get": {
|
"post": {
|
||||||
"responses": {
|
"responses": {
|
||||||
"200": {
|
"200": {
|
||||||
"description": "OK",
|
"description": "Normal chat completion response. **OR** Streamed chat completion response.",
|
||||||
"content": {
|
"content": {
|
||||||
"application/json": {
|
"application/json": {
|
||||||
"schema": {
|
"schema": {
|
||||||
"type": "string"
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/AgenticSystemExecuteResponse"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/StreamedAgenticSystemExecuteResponse"
|
||||||
|
}
|
||||||
|
]
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -46,7 +53,17 @@
|
||||||
"tags": [
|
"tags": [
|
||||||
"AgenticSystem"
|
"AgenticSystem"
|
||||||
],
|
],
|
||||||
"parameters": []
|
"parameters": [],
|
||||||
|
"requestBody": {
|
||||||
|
"content": {
|
||||||
|
"application/json": {
|
||||||
|
"schema": {
|
||||||
|
"$ref": "#/components/schemas/AgenticSystemExecuteRequest"
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"required": true
|
||||||
|
}
|
||||||
}
|
}
|
||||||
},
|
},
|
||||||
"/chat_completion": {
|
"/chat_completion": {
|
||||||
|
@ -127,24 +144,7 @@
|
||||||
"jsonSchemaDialect": "https://json-schema.org/draft/2020-12/schema",
|
"jsonSchemaDialect": "https://json-schema.org/draft/2020-12/schema",
|
||||||
"components": {
|
"components": {
|
||||||
"schemas": {
|
"schemas": {
|
||||||
"Attachment": {
|
"AgenticSystemExecuteRequest": {
|
||||||
"type": "object",
|
|
||||||
"properties": {
|
|
||||||
"url": {
|
|
||||||
"$ref": "#/components/schemas/URL"
|
|
||||||
},
|
|
||||||
"mime_type": {
|
|
||||||
"type": "string"
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"additionalProperties": false,
|
|
||||||
"required": [
|
|
||||||
"url",
|
|
||||||
"mime_type"
|
|
||||||
],
|
|
||||||
"title": "Attachments are used to refer to external resources, such as images, videos, audio, etc."
|
|
||||||
},
|
|
||||||
"ChatCompletionRequest": {
|
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"message": {
|
"message": {
|
||||||
|
@ -192,68 +192,21 @@
|
||||||
"top_k"
|
"top_k"
|
||||||
]
|
]
|
||||||
},
|
},
|
||||||
"max_tokens": {
|
"available_tools": {
|
||||||
"type": "integer",
|
"type": "array",
|
||||||
"default": 0
|
"items": {
|
||||||
},
|
"oneOf": [
|
||||||
"stream": {
|
{
|
||||||
"type": "boolean",
|
|
||||||
"default": false
|
|
||||||
},
|
|
||||||
"logprobs": {
|
|
||||||
"type": "boolean",
|
|
||||||
"default": false
|
|
||||||
}
|
|
||||||
},
|
|
||||||
"additionalProperties": false,
|
|
||||||
"required": [
|
|
||||||
"message",
|
|
||||||
"message_history",
|
|
||||||
"model",
|
|
||||||
"sampling_params",
|
|
||||||
"max_tokens",
|
|
||||||
"stream",
|
|
||||||
"logprobs"
|
|
||||||
]
|
|
||||||
},
|
|
||||||
"Message": {
|
|
||||||
"type": "object",
|
|
||||||
"properties": {
|
|
||||||
"role": {
|
|
||||||
"type": "string",
|
"type": "string",
|
||||||
"enum": [
|
"enum": [
|
||||||
"system",
|
"web_search",
|
||||||
"user",
|
"math",
|
||||||
"assistant",
|
"image_gen",
|
||||||
"tool"
|
"code_interpreter"
|
||||||
]
|
],
|
||||||
},
|
"title": "Builtin tools are tools the model is natively aware of and was potentially fine-tuned with."
|
||||||
"content": {
|
|
||||||
"oneOf": [
|
|
||||||
{
|
|
||||||
"type": "string"
|
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"$ref": "#/components/schemas/Attachment"
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"type": "array",
|
|
||||||
"items": {
|
|
||||||
"oneOf": [
|
|
||||||
{
|
|
||||||
"type": "string"
|
|
||||||
},
|
|
||||||
{
|
|
||||||
"$ref": "#/components/schemas/Attachment"
|
|
||||||
}
|
|
||||||
]
|
|
||||||
}
|
|
||||||
}
|
|
||||||
]
|
|
||||||
},
|
|
||||||
"tool_definitions": {
|
|
||||||
"type": "array",
|
|
||||||
"items": {
|
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"tool_name": {
|
"tool_name": {
|
||||||
|
@ -291,6 +244,83 @@
|
||||||
"parameters"
|
"parameters"
|
||||||
]
|
]
|
||||||
}
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"executable_tools": {
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
"uniqueItems": true
|
||||||
|
},
|
||||||
|
"stream": {
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"message",
|
||||||
|
"message_history",
|
||||||
|
"model",
|
||||||
|
"sampling_params",
|
||||||
|
"available_tools",
|
||||||
|
"executable_tools",
|
||||||
|
"stream"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"Attachment": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"url": {
|
||||||
|
"$ref": "#/components/schemas/URL"
|
||||||
|
},
|
||||||
|
"mime_type": {
|
||||||
|
"type": "string"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"url",
|
||||||
|
"mime_type"
|
||||||
|
],
|
||||||
|
"title": "Attachments are used to refer to external resources, such as images, videos, audio, etc."
|
||||||
|
},
|
||||||
|
"Message": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"role": {
|
||||||
|
"type": "string",
|
||||||
|
"enum": [
|
||||||
|
"system",
|
||||||
|
"user",
|
||||||
|
"assistant",
|
||||||
|
"tool"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"content": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/Attachment"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/Attachment"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
]
|
||||||
},
|
},
|
||||||
"tool_calls": {
|
"tool_calls": {
|
||||||
"type": "array",
|
"type": "array",
|
||||||
|
@ -358,7 +388,6 @@
|
||||||
"required": [
|
"required": [
|
||||||
"role",
|
"role",
|
||||||
"content",
|
"content",
|
||||||
"tool_definitions",
|
|
||||||
"tool_calls",
|
"tool_calls",
|
||||||
"tool_responses"
|
"tool_responses"
|
||||||
]
|
]
|
||||||
|
@ -368,7 +397,7 @@
|
||||||
"format": "uri",
|
"format": "uri",
|
||||||
"pattern": "^(https?://|file://|data:)"
|
"pattern": "^(https?://|file://|data:)"
|
||||||
},
|
},
|
||||||
"ChatCompletionResponse": {
|
"AgenticSystemExecuteResponse": {
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"content": {
|
"content": {
|
||||||
|
@ -479,7 +508,7 @@
|
||||||
],
|
],
|
||||||
"title": "Normal chat completion response."
|
"title": "Normal chat completion response."
|
||||||
},
|
},
|
||||||
"StreamedChatCompletionResponse": {
|
"StreamedAgenticSystemExecuteResponse": {
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
"text_delta": {
|
"text_delta": {
|
||||||
|
@ -541,6 +570,305 @@
|
||||||
],
|
],
|
||||||
"title": "Streamed chat completion response."
|
"title": "Streamed chat completion response."
|
||||||
},
|
},
|
||||||
|
"ChatCompletionRequest": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"message": {
|
||||||
|
"$ref": "#/components/schemas/Message"
|
||||||
|
},
|
||||||
|
"message_history": {
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"$ref": "#/components/schemas/Message"
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"model": {
|
||||||
|
"type": "string",
|
||||||
|
"enum": [
|
||||||
|
"llama3_8b_chat",
|
||||||
|
"llama3_70b_chat"
|
||||||
|
],
|
||||||
|
"default": "llama3_8b_chat"
|
||||||
|
},
|
||||||
|
"sampling_params": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"temperature": {
|
||||||
|
"type": "number",
|
||||||
|
"default": 0.0
|
||||||
|
},
|
||||||
|
"strategy": {
|
||||||
|
"type": "string",
|
||||||
|
"default": "greedy"
|
||||||
|
},
|
||||||
|
"top_p": {
|
||||||
|
"type": "number",
|
||||||
|
"default": 0.95
|
||||||
|
},
|
||||||
|
"top_k": {
|
||||||
|
"type": "integer",
|
||||||
|
"default": 0
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"temperature",
|
||||||
|
"strategy",
|
||||||
|
"top_p",
|
||||||
|
"top_k"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"available_tools": {
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "string",
|
||||||
|
"enum": [
|
||||||
|
"web_search",
|
||||||
|
"math",
|
||||||
|
"image_gen",
|
||||||
|
"code_interpreter"
|
||||||
|
],
|
||||||
|
"title": "Builtin tools are tools the model is natively aware of and was potentially fine-tuned with."
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"tool_name": {
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
"parameters": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "null"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "boolean"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "number"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "object"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"tool_name",
|
||||||
|
"parameters"
|
||||||
|
]
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"max_tokens": {
|
||||||
|
"type": "integer",
|
||||||
|
"default": 0
|
||||||
|
},
|
||||||
|
"stream": {
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false
|
||||||
|
},
|
||||||
|
"logprobs": {
|
||||||
|
"type": "boolean",
|
||||||
|
"default": false
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"message",
|
||||||
|
"message_history",
|
||||||
|
"model",
|
||||||
|
"sampling_params",
|
||||||
|
"available_tools",
|
||||||
|
"max_tokens",
|
||||||
|
"stream",
|
||||||
|
"logprobs"
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"ChatCompletionResponse": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"content": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/Attachment"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"$ref": "#/components/schemas/Attachment"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
]
|
||||||
|
},
|
||||||
|
"tool_calls": {
|
||||||
|
"type": "array",
|
||||||
|
"items": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"tool_name": {
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
"arguments": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "null"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "boolean"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "number"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "object"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"tool_name",
|
||||||
|
"arguments"
|
||||||
|
],
|
||||||
|
"title": "A tool call is a request to a tool."
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"stop_reason": {
|
||||||
|
"type": "string",
|
||||||
|
"enum": [
|
||||||
|
"not_stopped",
|
||||||
|
"finished_ok",
|
||||||
|
"max_tokens"
|
||||||
|
],
|
||||||
|
"title": "Stop reasons are used to indicate why the model stopped generating text."
|
||||||
|
},
|
||||||
|
"logprobs": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "null"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "boolean"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "number"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "object"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"content",
|
||||||
|
"tool_calls"
|
||||||
|
],
|
||||||
|
"title": "Normal chat completion response."
|
||||||
|
},
|
||||||
|
"StreamedChatCompletionResponse": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"text_delta": {
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
"stop_reason": {
|
||||||
|
"type": "string",
|
||||||
|
"enum": [
|
||||||
|
"not_stopped",
|
||||||
|
"finished_ok",
|
||||||
|
"max_tokens"
|
||||||
|
],
|
||||||
|
"title": "Stop reasons are used to indicate why the model stopped generating text."
|
||||||
|
},
|
||||||
|
"tool_call": {
|
||||||
|
"type": "object",
|
||||||
|
"properties": {
|
||||||
|
"tool_name": {
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
"arguments": {
|
||||||
|
"type": "object",
|
||||||
|
"additionalProperties": {
|
||||||
|
"oneOf": [
|
||||||
|
{
|
||||||
|
"type": "null"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "boolean"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "number"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "string"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "array"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"type": "object"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"tool_name",
|
||||||
|
"arguments"
|
||||||
|
],
|
||||||
|
"title": "A tool call is a request to a tool."
|
||||||
|
}
|
||||||
|
},
|
||||||
|
"additionalProperties": false,
|
||||||
|
"required": [
|
||||||
|
"text_delta"
|
||||||
|
],
|
||||||
|
"title": "Streamed chat completion response."
|
||||||
|
},
|
||||||
"CompletionRequest": {
|
"CompletionRequest": {
|
||||||
"type": "object",
|
"type": "object",
|
||||||
"properties": {
|
"properties": {
|
||||||
|
@ -689,8 +1017,7 @@
|
||||||
},
|
},
|
||||||
"additionalProperties": false,
|
"additionalProperties": false,
|
||||||
"required": [
|
"required": [
|
||||||
"content",
|
"content"
|
||||||
"stop_reason"
|
|
||||||
],
|
],
|
||||||
"title": "Normal completion response."
|
"title": "Normal completion response."
|
||||||
},
|
},
|
||||||
|
@ -737,8 +1064,7 @@
|
||||||
},
|
},
|
||||||
"additionalProperties": false,
|
"additionalProperties": false,
|
||||||
"required": [
|
"required": [
|
||||||
"text_delta",
|
"text_delta"
|
||||||
"stop_reason"
|
|
||||||
],
|
],
|
||||||
"title": "streamed completion response."
|
"title": "streamed completion response."
|
||||||
}
|
}
|
||||||
|
@ -751,20 +1077,20 @@
|
||||||
}
|
}
|
||||||
],
|
],
|
||||||
"tags": [
|
"tags": [
|
||||||
|
{
|
||||||
|
"name": "Inference"
|
||||||
|
},
|
||||||
{
|
{
|
||||||
"name": "AgenticSystem"
|
"name": "AgenticSystem"
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"name": "Inference"
|
"name": "AgenticSystemExecuteRequest",
|
||||||
|
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/AgenticSystemExecuteRequest\" />"
|
||||||
},
|
},
|
||||||
{
|
{
|
||||||
"name": "Attachment",
|
"name": "Attachment",
|
||||||
"description": "Attachments are used to refer to external resources, such as images, videos, audio, etc.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/Attachment\" />"
|
"description": "Attachments are used to refer to external resources, such as images, videos, audio, etc.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/Attachment\" />"
|
||||||
},
|
},
|
||||||
{
|
|
||||||
"name": "ChatCompletionRequest",
|
|
||||||
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/ChatCompletionRequest\" />"
|
|
||||||
},
|
|
||||||
{
|
{
|
||||||
"name": "Message",
|
"name": "Message",
|
||||||
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/Message\" />"
|
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/Message\" />"
|
||||||
|
@ -773,6 +1099,18 @@
|
||||||
"name": "URL",
|
"name": "URL",
|
||||||
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/URL\" />"
|
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/URL\" />"
|
||||||
},
|
},
|
||||||
|
{
|
||||||
|
"name": "AgenticSystemExecuteResponse",
|
||||||
|
"description": "Normal chat completion response.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/AgenticSystemExecuteResponse\" />"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "StreamedAgenticSystemExecuteResponse",
|
||||||
|
"description": "Streamed chat completion response.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/StreamedAgenticSystemExecuteResponse\" />"
|
||||||
|
},
|
||||||
|
{
|
||||||
|
"name": "ChatCompletionRequest",
|
||||||
|
"description": "<SchemaDefinition schemaRef=\"#/components/schemas/ChatCompletionRequest\" />"
|
||||||
|
},
|
||||||
{
|
{
|
||||||
"name": "ChatCompletionResponse",
|
"name": "ChatCompletionResponse",
|
||||||
"description": "Normal chat completion response.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/ChatCompletionResponse\" />"
|
"description": "Normal chat completion response.\n\n<SchemaDefinition schemaRef=\"#/components/schemas/ChatCompletionResponse\" />"
|
||||||
|
@ -805,12 +1143,15 @@
|
||||||
{
|
{
|
||||||
"name": "Types",
|
"name": "Types",
|
||||||
"tags": [
|
"tags": [
|
||||||
|
"AgenticSystemExecuteRequest",
|
||||||
|
"AgenticSystemExecuteResponse",
|
||||||
"Attachment",
|
"Attachment",
|
||||||
"ChatCompletionRequest",
|
"ChatCompletionRequest",
|
||||||
"ChatCompletionResponse",
|
"ChatCompletionResponse",
|
||||||
"CompletionRequest",
|
"CompletionRequest",
|
||||||
"CompletionResponse",
|
"CompletionResponse",
|
||||||
"Message",
|
"Message",
|
||||||
|
"StreamedAgenticSystemExecuteResponse",
|
||||||
"StreamedChatCompletionResponse",
|
"StreamedChatCompletionResponse",
|
||||||
"StreamedCompletionResponse",
|
"StreamedCompletionResponse",
|
||||||
"URL"
|
"URL"
|
||||||
|
|
|
@ -1,6 +1,147 @@
|
||||||
components:
|
components:
|
||||||
responses: {}
|
responses: {}
|
||||||
schemas:
|
schemas:
|
||||||
|
AgenticSystemExecuteRequest:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
available_tools:
|
||||||
|
items:
|
||||||
|
oneOf:
|
||||||
|
- enum:
|
||||||
|
- web_search
|
||||||
|
- math
|
||||||
|
- image_gen
|
||||||
|
- code_interpreter
|
||||||
|
title: Builtin tools are tools the model is natively aware of and was
|
||||||
|
potentially fine-tuned with.
|
||||||
|
type: string
|
||||||
|
- additionalProperties: false
|
||||||
|
properties:
|
||||||
|
parameters:
|
||||||
|
additionalProperties:
|
||||||
|
oneOf:
|
||||||
|
- type: 'null'
|
||||||
|
- type: boolean
|
||||||
|
- type: number
|
||||||
|
- type: string
|
||||||
|
- type: array
|
||||||
|
- type: object
|
||||||
|
type: object
|
||||||
|
tool_name:
|
||||||
|
type: string
|
||||||
|
required:
|
||||||
|
- tool_name
|
||||||
|
- parameters
|
||||||
|
type: object
|
||||||
|
type: array
|
||||||
|
executable_tools:
|
||||||
|
items:
|
||||||
|
type: string
|
||||||
|
type: array
|
||||||
|
uniqueItems: true
|
||||||
|
message:
|
||||||
|
$ref: '#/components/schemas/Message'
|
||||||
|
message_history:
|
||||||
|
items:
|
||||||
|
$ref: '#/components/schemas/Message'
|
||||||
|
type: array
|
||||||
|
model:
|
||||||
|
default: llama3_8b_chat
|
||||||
|
enum:
|
||||||
|
- llama3_8b_chat
|
||||||
|
- llama3_70b_chat
|
||||||
|
type: string
|
||||||
|
sampling_params:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
strategy:
|
||||||
|
default: greedy
|
||||||
|
type: string
|
||||||
|
temperature:
|
||||||
|
default: 0.0
|
||||||
|
type: number
|
||||||
|
top_k:
|
||||||
|
default: 0
|
||||||
|
type: integer
|
||||||
|
top_p:
|
||||||
|
default: 0.95
|
||||||
|
type: number
|
||||||
|
required:
|
||||||
|
- temperature
|
||||||
|
- strategy
|
||||||
|
- top_p
|
||||||
|
- top_k
|
||||||
|
type: object
|
||||||
|
stream:
|
||||||
|
default: false
|
||||||
|
type: boolean
|
||||||
|
required:
|
||||||
|
- message
|
||||||
|
- message_history
|
||||||
|
- model
|
||||||
|
- sampling_params
|
||||||
|
- available_tools
|
||||||
|
- executable_tools
|
||||||
|
- stream
|
||||||
|
type: object
|
||||||
|
AgenticSystemExecuteResponse:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
content:
|
||||||
|
oneOf:
|
||||||
|
- type: string
|
||||||
|
- $ref: '#/components/schemas/Attachment'
|
||||||
|
- items:
|
||||||
|
oneOf:
|
||||||
|
- type: string
|
||||||
|
- $ref: '#/components/schemas/Attachment'
|
||||||
|
type: array
|
||||||
|
logprobs:
|
||||||
|
additionalProperties:
|
||||||
|
oneOf:
|
||||||
|
- type: 'null'
|
||||||
|
- type: boolean
|
||||||
|
- type: number
|
||||||
|
- type: string
|
||||||
|
- type: array
|
||||||
|
- type: object
|
||||||
|
type: object
|
||||||
|
stop_reason:
|
||||||
|
enum:
|
||||||
|
- not_stopped
|
||||||
|
- finished_ok
|
||||||
|
- max_tokens
|
||||||
|
title: Stop reasons are used to indicate why the model stopped generating
|
||||||
|
text.
|
||||||
|
type: string
|
||||||
|
tool_calls:
|
||||||
|
items:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
arguments:
|
||||||
|
additionalProperties:
|
||||||
|
oneOf:
|
||||||
|
- type: 'null'
|
||||||
|
- type: boolean
|
||||||
|
- type: number
|
||||||
|
- type: string
|
||||||
|
- type: array
|
||||||
|
- type: object
|
||||||
|
type: object
|
||||||
|
tool_name:
|
||||||
|
type: string
|
||||||
|
required:
|
||||||
|
- tool_name
|
||||||
|
- arguments
|
||||||
|
title: A tool call is a request to a tool.
|
||||||
|
type: object
|
||||||
|
type: array
|
||||||
|
required:
|
||||||
|
- content
|
||||||
|
- stop_reason
|
||||||
|
- tool_calls
|
||||||
|
title: Normal chat completion response.
|
||||||
|
type: object
|
||||||
Attachment:
|
Attachment:
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
properties:
|
properties:
|
||||||
|
@ -17,6 +158,36 @@ components:
|
||||||
ChatCompletionRequest:
|
ChatCompletionRequest:
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
properties:
|
properties:
|
||||||
|
available_tools:
|
||||||
|
items:
|
||||||
|
oneOf:
|
||||||
|
- enum:
|
||||||
|
- web_search
|
||||||
|
- math
|
||||||
|
- image_gen
|
||||||
|
- code_interpreter
|
||||||
|
title: Builtin tools are tools the model is natively aware of and was
|
||||||
|
potentially fine-tuned with.
|
||||||
|
type: string
|
||||||
|
- additionalProperties: false
|
||||||
|
properties:
|
||||||
|
parameters:
|
||||||
|
additionalProperties:
|
||||||
|
oneOf:
|
||||||
|
- type: 'null'
|
||||||
|
- type: boolean
|
||||||
|
- type: number
|
||||||
|
- type: string
|
||||||
|
- type: array
|
||||||
|
- type: object
|
||||||
|
type: object
|
||||||
|
tool_name:
|
||||||
|
type: string
|
||||||
|
required:
|
||||||
|
- tool_name
|
||||||
|
- parameters
|
||||||
|
type: object
|
||||||
|
type: array
|
||||||
logprobs:
|
logprobs:
|
||||||
default: false
|
default: false
|
||||||
type: boolean
|
type: boolean
|
||||||
|
@ -64,6 +235,7 @@ components:
|
||||||
- message_history
|
- message_history
|
||||||
- model
|
- model
|
||||||
- sampling_params
|
- sampling_params
|
||||||
|
- available_tools
|
||||||
- max_tokens
|
- max_tokens
|
||||||
- stream
|
- stream
|
||||||
- logprobs
|
- logprobs
|
||||||
|
@ -122,7 +294,6 @@ components:
|
||||||
type: array
|
type: array
|
||||||
required:
|
required:
|
||||||
- content
|
- content
|
||||||
- stop_reason
|
|
||||||
- tool_calls
|
- tool_calls
|
||||||
title: Normal chat completion response.
|
title: Normal chat completion response.
|
||||||
type: object
|
type: object
|
||||||
|
@ -214,7 +385,6 @@ components:
|
||||||
type: string
|
type: string
|
||||||
required:
|
required:
|
||||||
- content
|
- content
|
||||||
- stop_reason
|
|
||||||
title: Normal completion response.
|
title: Normal completion response.
|
||||||
type: object
|
type: object
|
||||||
Message:
|
Message:
|
||||||
|
@ -258,27 +428,6 @@ components:
|
||||||
title: A tool call is a request to a tool.
|
title: A tool call is a request to a tool.
|
||||||
type: object
|
type: object
|
||||||
type: array
|
type: array
|
||||||
tool_definitions:
|
|
||||||
items:
|
|
||||||
additionalProperties: false
|
|
||||||
properties:
|
|
||||||
parameters:
|
|
||||||
additionalProperties:
|
|
||||||
oneOf:
|
|
||||||
- type: 'null'
|
|
||||||
- type: boolean
|
|
||||||
- type: number
|
|
||||||
- type: string
|
|
||||||
- type: array
|
|
||||||
- type: object
|
|
||||||
type: object
|
|
||||||
tool_name:
|
|
||||||
type: string
|
|
||||||
required:
|
|
||||||
- tool_name
|
|
||||||
- parameters
|
|
||||||
type: object
|
|
||||||
type: array
|
|
||||||
tool_responses:
|
tool_responses:
|
||||||
items:
|
items:
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
|
@ -295,11 +444,10 @@ components:
|
||||||
required:
|
required:
|
||||||
- role
|
- role
|
||||||
- content
|
- content
|
||||||
- tool_definitions
|
|
||||||
- tool_calls
|
- tool_calls
|
||||||
- tool_responses
|
- tool_responses
|
||||||
type: object
|
type: object
|
||||||
StreamedChatCompletionResponse:
|
StreamedAgenticSystemExecuteResponse:
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
properties:
|
properties:
|
||||||
stop_reason:
|
stop_reason:
|
||||||
|
@ -337,6 +485,43 @@ components:
|
||||||
- stop_reason
|
- stop_reason
|
||||||
title: Streamed chat completion response.
|
title: Streamed chat completion response.
|
||||||
type: object
|
type: object
|
||||||
|
StreamedChatCompletionResponse:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
stop_reason:
|
||||||
|
enum:
|
||||||
|
- not_stopped
|
||||||
|
- finished_ok
|
||||||
|
- max_tokens
|
||||||
|
title: Stop reasons are used to indicate why the model stopped generating
|
||||||
|
text.
|
||||||
|
type: string
|
||||||
|
text_delta:
|
||||||
|
type: string
|
||||||
|
tool_call:
|
||||||
|
additionalProperties: false
|
||||||
|
properties:
|
||||||
|
arguments:
|
||||||
|
additionalProperties:
|
||||||
|
oneOf:
|
||||||
|
- type: 'null'
|
||||||
|
- type: boolean
|
||||||
|
- type: number
|
||||||
|
- type: string
|
||||||
|
- type: array
|
||||||
|
- type: object
|
||||||
|
type: object
|
||||||
|
tool_name:
|
||||||
|
type: string
|
||||||
|
required:
|
||||||
|
- tool_name
|
||||||
|
- arguments
|
||||||
|
title: A tool call is a request to a tool.
|
||||||
|
type: object
|
||||||
|
required:
|
||||||
|
- text_delta
|
||||||
|
title: Streamed chat completion response.
|
||||||
|
type: object
|
||||||
StreamedCompletionResponse:
|
StreamedCompletionResponse:
|
||||||
additionalProperties: false
|
additionalProperties: false
|
||||||
properties:
|
properties:
|
||||||
|
@ -362,7 +547,6 @@ components:
|
||||||
type: string
|
type: string
|
||||||
required:
|
required:
|
||||||
- text_delta
|
- text_delta
|
||||||
- stop_reason
|
|
||||||
title: streamed completion response.
|
title: streamed completion response.
|
||||||
type: object
|
type: object
|
||||||
URL:
|
URL:
|
||||||
|
@ -377,15 +561,24 @@ jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema
|
||||||
openapi: 3.1.0
|
openapi: 3.1.0
|
||||||
paths:
|
paths:
|
||||||
/agentic/system/execute:
|
/agentic/system/execute:
|
||||||
get:
|
post:
|
||||||
parameters: []
|
parameters: []
|
||||||
|
requestBody:
|
||||||
|
content:
|
||||||
|
application/json:
|
||||||
|
schema:
|
||||||
|
$ref: '#/components/schemas/AgenticSystemExecuteRequest'
|
||||||
|
required: true
|
||||||
responses:
|
responses:
|
||||||
'200':
|
'200':
|
||||||
content:
|
content:
|
||||||
application/json:
|
application/json:
|
||||||
schema:
|
schema:
|
||||||
type: string
|
oneOf:
|
||||||
description: OK
|
- $ref: '#/components/schemas/AgenticSystemExecuteResponse'
|
||||||
|
- $ref: '#/components/schemas/StreamedAgenticSystemExecuteResponse'
|
||||||
|
description: Normal chat completion response. **OR** Streamed chat completion
|
||||||
|
response.
|
||||||
tags:
|
tags:
|
||||||
- AgenticSystem
|
- AgenticSystem
|
||||||
/chat_completion:
|
/chat_completion:
|
||||||
|
@ -434,17 +627,17 @@ security:
|
||||||
servers:
|
servers:
|
||||||
- url: http://llama.meta.com
|
- url: http://llama.meta.com
|
||||||
tags:
|
tags:
|
||||||
- name: AgenticSystem
|
|
||||||
- name: Inference
|
- name: Inference
|
||||||
|
- name: AgenticSystem
|
||||||
|
- description: <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteRequest"
|
||||||
|
/>
|
||||||
|
name: AgenticSystemExecuteRequest
|
||||||
- description: 'Attachments are used to refer to external resources, such as images,
|
- description: 'Attachments are used to refer to external resources, such as images,
|
||||||
videos, audio, etc.
|
videos, audio, etc.
|
||||||
|
|
||||||
|
|
||||||
<SchemaDefinition schemaRef="#/components/schemas/Attachment" />'
|
<SchemaDefinition schemaRef="#/components/schemas/Attachment" />'
|
||||||
name: Attachment
|
name: Attachment
|
||||||
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest"
|
|
||||||
/>
|
|
||||||
name: ChatCompletionRequest
|
|
||||||
- description: <SchemaDefinition schemaRef="#/components/schemas/Message" />
|
- description: <SchemaDefinition schemaRef="#/components/schemas/Message" />
|
||||||
name: Message
|
name: Message
|
||||||
- description: <SchemaDefinition schemaRef="#/components/schemas/URL" />
|
- description: <SchemaDefinition schemaRef="#/components/schemas/URL" />
|
||||||
|
@ -452,6 +645,21 @@ tags:
|
||||||
- description: 'Normal chat completion response.
|
- description: 'Normal chat completion response.
|
||||||
|
|
||||||
|
|
||||||
|
<SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteResponse"
|
||||||
|
/>'
|
||||||
|
name: AgenticSystemExecuteResponse
|
||||||
|
- description: 'Streamed chat completion response.
|
||||||
|
|
||||||
|
|
||||||
|
<SchemaDefinition schemaRef="#/components/schemas/StreamedAgenticSystemExecuteResponse"
|
||||||
|
/>'
|
||||||
|
name: StreamedAgenticSystemExecuteResponse
|
||||||
|
- description: <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest"
|
||||||
|
/>
|
||||||
|
name: ChatCompletionRequest
|
||||||
|
- description: 'Normal chat completion response.
|
||||||
|
|
||||||
|
|
||||||
<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />'
|
<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />'
|
||||||
name: ChatCompletionResponse
|
name: ChatCompletionResponse
|
||||||
- description: 'Streamed chat completion response.
|
- description: 'Streamed chat completion response.
|
||||||
|
@ -481,12 +689,15 @@ x-tagGroups:
|
||||||
- Inference
|
- Inference
|
||||||
- name: Types
|
- name: Types
|
||||||
tags:
|
tags:
|
||||||
|
- AgenticSystemExecuteRequest
|
||||||
|
- AgenticSystemExecuteResponse
|
||||||
- Attachment
|
- Attachment
|
||||||
- ChatCompletionRequest
|
- ChatCompletionRequest
|
||||||
- ChatCompletionResponse
|
- ChatCompletionResponse
|
||||||
- CompletionRequest
|
- CompletionRequest
|
||||||
- CompletionResponse
|
- CompletionResponse
|
||||||
- Message
|
- Message
|
||||||
|
- StreamedAgenticSystemExecuteResponse
|
||||||
- StreamedChatCompletionResponse
|
- StreamedChatCompletionResponse
|
||||||
- StreamedCompletionResponse
|
- StreamedCompletionResponse
|
||||||
- URL
|
- URL
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue