# llama-stack-mirror/source/openapi.yaml

components:
  responses: {}
  schemas:
    AgenticSystemCreateRequest:
      # Request body of POST /agentic_system/create.
      type: object
      additionalProperties: false
      required:
      - instructions
      - model
      - available_tools
      - executable_tools
      properties:
        instructions:
          type: string
        model:
          type: string
          enum:
          - llama3_8b_chat
          - llama3_70b_chat
        available_tools:
          type: array
          items:
            # Each entry is either one of the enumerated built-in tool names
            # or an object carrying `tool_name` and `parameters`.
            oneOf:
            - type: string
              title: >-
                Builtin tools are tools the model is natively aware of and was
                potentially fine-tuned with.
              enum:
              - web_search
              - math
              - image_gen
              - code_interpreter
            - type: object
              additionalProperties: false
              required:
              - tool_name
              - parameters
              properties:
                tool_name:
                  type: string
                parameters:
                  # Free-form map: keys are unconstrained and each value may
                  # be any JSON type.
                  type: object
                  additionalProperties:
                    oneOf:
                    - type: "null"
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
        executable_tools:
          # List of strings; uniqueItems forbids duplicates.
          type: array
          uniqueItems: true
          items:
            type: string
    AgenticSystemCreateResponse:
      # 200 response body of POST /agentic_system/create.
      type: object
      additionalProperties: false
      required:
      - agent_id
      properties:
        agent_id:
          type: string
    AgenticSystemExecuteRequest:
      # Request body of POST /agentic_system/execute.
      additionalProperties: false
      properties:
        agent_id:
          type: string
        messages:
          items:
            $ref: '#/components/schemas/Message'
          type: array
        stream:
          # Optional; an omitted value is treated as the default below.
          default: false
          type: boolean
        turn_history:
          items:
            $ref: '#/components/schemas/AgenticSystemTurn'
          type: array
      # `stream` is deliberately absent from this list: it declares a default,
      # and a default can only take effect when the property may be omitted.
      required:
      - agent_id
      - messages
      - turn_history
      type: object
    AgenticSystemExecuteResponse:
      # Wraps a single AgenticSystemTurn.
      type: object
      title: non-stream response from the agentic system.
      additionalProperties: false
      required:
      - turn
      properties:
        turn:
          $ref: "#/components/schemas/AgenticSystemTurn"
    AgenticSystemExecuteResponseStreamChunk:
      type: object
      title: Streamed agent execution response.
      additionalProperties: false
      # Only `turn` is mandatory; `stop_reason` may be omitted.
      required:
      - turn
      properties:
        turn:
          $ref: "#/components/schemas/AgenticSystemTurn"
        stop_reason:
          type: string
          title: >-
            Stop reasons are used to indicate why the model stopped generating
            text.
          enum:
          - not_stopped
          - finished_ok
          - max_tokens
    AgenticSystemTurn:
      # One turn: the user messages, the steps executed, and the response
      # message. All three are required.
      additionalProperties: false
      properties:
        response_message:
          $ref: '#/components/schemas/Message'
        steps:
          items:
            # Exactly one variant must match. Each variant pins `step_type` to
            # its own single value so the field discriminates between the
            # variants; previously every variant accepted all four values, so
            # e.g. {step_type: model_inference} validated as a safety step.
            oneOf:
            # Variant: model inference (text plus optional logprobs).
            - additionalProperties: false
              properties:
                logprobs:
                  # Free-form map; each value may be any JSON type.
                  additionalProperties:
                    oneOf:
                    - type: 'null'
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
                  type: object
                step_type:
                  default: model_inference
                  enum:
                  - model_inference
                  title: The type of execution step.
                  type: string
                text:
                  type: string
              required:
              - step_type
              - text
              type: object
            # Variant: tool execution (calls issued and responses received).
            - additionalProperties: false
              properties:
                step_type:
                  default: tool_execution
                  enum:
                  - tool_execution
                  title: The type of execution step.
                  type: string
                tool_calls:
                  items:
                    additionalProperties: false
                    properties:
                      arguments:
                        # Free-form map; each value may be any JSON type.
                        additionalProperties:
                          oneOf:
                          - type: 'null'
                          - type: boolean
                          - type: number
                          - type: string
                          - type: array
                          - type: object
                        type: object
                      tool_name:
                        type: string
                    required:
                    - tool_name
                    - arguments
                    title: A tool call is a request to a tool.
                    type: object
                  type: array
                tool_responses:
                  items:
                    additionalProperties: false
                    properties:
                      response:
                        type: string
                      tool_name:
                        type: string
                    required:
                    - tool_name
                    - response
                    type: object
                  type: array
              required:
              - step_type
              - tool_calls
              - tool_responses
              type: object
            # Variant: safety filtering (`violation` is optional).
            - additionalProperties: false
              properties:
                step_type:
                  default: safety_filtering
                  enum:
                  - safety_filtering
                  title: The type of execution step.
                  type: string
                violation:
                  additionalProperties: false
                  properties:
                    details:
                      type: string
                    suggested_user_response:
                      type: string
                    violation_type:
                      type: string
                  required:
                  - violation_type
                  - details
                  type: object
              required:
              - step_type
              type: object
            # Variant: memory retrieval (documents and their scores).
            - additionalProperties: false
              properties:
                documents:
                  items:
                    type: string
                  type: array
                scores:
                  items:
                    type: number
                  type: array
                step_type:
                  default: memory_retrieval
                  enum:
                  - memory_retrieval
                  title: The type of execution step.
                  type: string
              required:
              - step_type
              - documents
              - scores
              type: object
          type: array
        user_messages:
          items:
            $ref: '#/components/schemas/Message'
          type: array
      required:
      - user_messages
      - steps
      - response_message
      title: A single turn in an interaction with an Agentic System.
      type: object
    Attachment:
      type: object
      title: >-
        Attachments are used to refer to external resources, such as images,
        videos, audio, etc.
      additionalProperties: false
      required:
      - url
      - mime_type
      properties:
        url:
          $ref: "#/components/schemas/URL"
        mime_type:
          type: string
    ChatCompletionRequest:
      # Request body of POST /chat_completion.
      additionalProperties: false
      properties:
        available_tools:
          items:
            # Each entry is either one of the enumerated built-in tool names
            # or an object carrying `tool_name` and `parameters`.
            oneOf:
            - enum:
              - web_search
              - math
              - image_gen
              - code_interpreter
              title: Builtin tools are tools the model is natively aware of and was
                potentially fine-tuned with.
              type: string
            - additionalProperties: false
              properties:
                parameters:
                  # Free-form map; each value may be any JSON type.
                  additionalProperties:
                    oneOf:
                    - type: 'null'
                    - type: boolean
                    - type: number
                    - type: string
                    - type: array
                    - type: object
                  type: object
                tool_name:
                  type: string
              required:
              - tool_name
              - parameters
              type: object
          type: array
        logprobs:
          default: false
          type: boolean
        max_tokens:
          default: 0
          type: integer
        message:
          $ref: '#/components/schemas/Message'
        message_history:
          items:
            $ref: '#/components/schemas/Message'
          type: array
        model:
          enum:
          - llama3_8b_chat
          - llama3_70b_chat
          type: string
        sampling_params:
          # The object itself is required, but every member declares a
          # default and may therefore be omitted individually.
          additionalProperties: false
          properties:
            strategy:
              default: greedy
              type: string
            temperature:
              default: 0.0
              type: number
            top_k:
              default: 0
              type: integer
            top_p:
              default: 0.95
              type: number
          type: object
        stream:
          default: false
          type: boolean
      # Properties that declare a default (`max_tokens`, `stream`, `logprobs`)
      # are not listed: a default can only apply to an omittable property.
      required:
      - message
      - model
      - message_history
      - sampling_params
      - available_tools
      type: object
    ChatCompletionResponse:
      type: object
      title: Normal chat completion response.
      additionalProperties: false
      required:
      - content
      - tool_calls
      properties:
        content:
          # A string, a single Attachment, or an array mixing both.
          oneOf:
          - type: string
          - $ref: "#/components/schemas/Attachment"
          - type: array
            items:
              oneOf:
              - type: string
              - $ref: "#/components/schemas/Attachment"
        stop_reason:
          type: string
          title: >-
            Stop reasons are used to indicate why the model stopped generating
            text.
          enum:
          - not_stopped
          - finished_ok
          - max_tokens
        tool_calls:
          type: array
          items:
            type: object
            title: A tool call is a request to a tool.
            additionalProperties: false
            required:
            - tool_name
            - arguments
            properties:
              tool_name:
                type: string
              arguments:
                # Free-form map; each value may be any JSON type.
                type: object
                additionalProperties:
                  oneOf:
                  - type: "null"
                  - type: boolean
                  - type: number
                  - type: string
                  - type: array
                  - type: object
        logprobs:
          # Free-form map; each value may be any JSON type.
          type: object
          additionalProperties:
            oneOf:
            - type: "null"
            - type: boolean
            - type: number
            - type: string
            - type: array
            - type: object
    ChatCompletionResponseStreamChunk:
      type: object
      title: >-
        Streamed chat completion response. The actual response is a series of
        such objects.
      additionalProperties: false
      # Only `text_delta` is mandatory on a chunk.
      required:
      - text_delta
      properties:
        text_delta:
          type: string
        stop_reason:
          type: string
          title: >-
            Stop reasons are used to indicate why the model stopped generating
            text.
          enum:
          - not_stopped
          - finished_ok
          - max_tokens
        tool_call:
          type: object
          title: A tool call is a request to a tool.
          additionalProperties: false
          required:
          - tool_name
          - arguments
          properties:
            tool_name:
              type: string
            arguments:
              # Free-form map; each value may be any JSON type.
              type: object
              additionalProperties:
                oneOf:
                - type: "null"
                - type: boolean
                - type: number
                - type: string
                - type: array
                - type: object
    CompletionRequest:
      # Request body of POST /completion.
      additionalProperties: false
      properties:
        content:
          # A string, a single Attachment, or an array mixing both.
          oneOf:
          - type: string
          - $ref: '#/components/schemas/Attachment'
          - items:
              oneOf:
              - type: string
              - $ref: '#/components/schemas/Attachment'
            type: array
        logprobs:
          default: false
          type: boolean
        max_tokens:
          default: 0
          type: integer
        model:
          enum:
          - llama3_8b
          - llama3_70b
          type: string
        sampling_params:
          # The object itself is required, but every member declares a
          # default and may therefore be omitted individually.
          additionalProperties: false
          properties:
            strategy:
              default: greedy
              type: string
            temperature:
              default: 0.0
              type: number
            top_k:
              default: 0
              type: integer
            top_p:
              default: 0.95
              type: number
          type: object
        stream:
          default: false
          type: boolean
      # Properties that declare a default (`max_tokens`, `stream`, `logprobs`)
      # are not listed: a default can only apply to an omittable property.
      required:
      - content
      - model
      - sampling_params
      type: object
    CompletionResponse:
      type: object
      title: Normal completion response.
      additionalProperties: false
      required:
      - content
      properties:
        content:
          # A string, a single Attachment, or an array mixing both.
          oneOf:
          - type: string
          - $ref: "#/components/schemas/Attachment"
          - type: array
            items:
              oneOf:
              - type: string
              - $ref: "#/components/schemas/Attachment"
        stop_reason:
          type: string
          title: >-
            Stop reasons are used to indicate why the model stopped generating
            text.
          enum:
          - not_stopped
          - finished_ok
          - max_tokens
        logprobs:
          # Free-form map; each value may be any JSON type.
          type: object
          additionalProperties:
            oneOf:
            - type: "null"
            - type: boolean
            - type: number
            - type: string
            - type: array
            - type: object
    CompletionResponseStreamChunk:
      type: object
      title: streamed completion response.
      additionalProperties: false
      # Only `text_delta` is mandatory on a chunk.
      required:
      - text_delta
      properties:
        text_delta:
          type: string
        stop_reason:
          type: string
          title: >-
            Stop reasons are used to indicate why the model stopped generating
            text.
          enum:
          - not_stopped
          - finished_ok
          - max_tokens
        logprobs:
          # Free-form map; each value may be any JSON type.
          type: object
          additionalProperties:
            oneOf:
            - type: "null"
            - type: boolean
            - type: number
            - type: string
            - type: array
            - type: object
    Message:
      # All four properties are required.
      type: object
      additionalProperties: false
      required:
      - role
      - content
      - tool_calls
      - tool_responses
      properties:
        role:
          type: string
          enum:
          - system
          - user
          - assistant
          - tool
        content:
          # A string, a single Attachment, or an array mixing both.
          oneOf:
          - type: string
          - $ref: "#/components/schemas/Attachment"
          - type: array
            items:
              oneOf:
              - type: string
              - $ref: "#/components/schemas/Attachment"
        tool_calls:
          type: array
          items:
            type: object
            title: A tool call is a request to a tool.
            additionalProperties: false
            required:
            - tool_name
            - arguments
            properties:
              tool_name:
                type: string
              arguments:
                # Free-form map; each value may be any JSON type.
                type: object
                additionalProperties:
                  oneOf:
                  - type: "null"
                  - type: boolean
                  - type: number
                  - type: string
                  - type: array
                  - type: object
        tool_responses:
          type: array
          items:
            type: object
            additionalProperties: false
            required:
            - tool_name
            - response
            properties:
              tool_name:
                type: string
              response:
                type: string
    URL:
      # String that must start with http://, https://, file:// or data:
      type: string
      format: uri
      pattern: '^(https?://|file://|data:)'
# Document-level metadata: spec version, schema dialect, and API info.
openapi: "3.1.0"
jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema
info:
  title: Llama Stack specification
  description: This is the llama stack
  # Quoted so the version stays a string rather than the float 0.1.
  version: "0.1"
paths:
  /agentic_system/create:
    post:
      tags:
      - AgenticSystem
      parameters: []
      # A JSON body is mandatory.
      requestBody:
        required: true
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/AgenticSystemCreateRequest"
      responses:
        "200":
          description: OK
          content:
            application/json:
              schema:
                $ref: "#/components/schemas/AgenticSystemCreateResponse"
  /agentic_system/execute:
    post:
      tags:
      - AgenticSystem
      parameters: []
      # A JSON body is mandatory.
      requestBody:
        required: true
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/AgenticSystemExecuteRequest"
      responses:
        "200":
          description: >-
            non-stream response from the agentic system. **OR** Streamed
            agent execution response.
          content:
            application/json:
              schema:
                # Either the full response or a stream chunk.
                oneOf:
                - $ref: "#/components/schemas/AgenticSystemExecuteResponse"
                - $ref: "#/components/schemas/AgenticSystemExecuteResponseStreamChunk"
  /chat_completion:
    post:
      tags:
      - Inference
      parameters: []
      # A JSON body is mandatory.
      requestBody:
        required: true
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/ChatCompletionRequest"
      responses:
        "200":
          description: >-
            Normal chat completion response. **OR** Streamed chat completion
            response. The actual response is a series of such objects.
          content:
            # NOTE(review): the streamed form is described as a series of
            # objects yet is declared under application/json; confirm the
            # actual wire format.
            application/json:
              schema:
                oneOf:
                - $ref: "#/components/schemas/ChatCompletionResponse"
                - $ref: "#/components/schemas/ChatCompletionResponseStreamChunk"
  /completion:
    post:
      tags:
      - Inference
      parameters: []
      # A JSON body is mandatory.
      requestBody:
        required: true
        content:
          application/json:
            schema:
              $ref: "#/components/schemas/CompletionRequest"
      responses:
        "200":
          description: >-
            Normal completion response. **OR** streamed completion response.
          content:
            application/json:
              schema:
                # Either the full response or a stream chunk.
                oneOf:
                - $ref: "#/components/schemas/CompletionResponse"
                - $ref: "#/components/schemas/CompletionResponseStreamChunk"
# Global security requirement applied to every operation.
# NOTE(review): `Default` is not declared under components.securitySchemes
# (components only defines `responses` and `schemas`); OpenAPI requires each
# name used here to match a declared scheme — confirm where it is defined.
security:
- Default: []
# Base URL against which the paths are resolved.
# NOTE(review): plain http — confirm whether https is intended.
servers:
- url: http://llama.meta.com
tags:
# Operation tags referenced by the path items.
- name: Inference
- name: AgenticSystem
# One tag per schema; each description embeds a <SchemaDefinition> element
# pointing at the schema (presumably rendered by the documentation tool).
- name: AgenticSystemCreateRequest
  description: '<SchemaDefinition schemaRef="#/components/schemas/AgenticSystemCreateRequest" />'
- name: AgenticSystemCreateResponse
  description: '<SchemaDefinition schemaRef="#/components/schemas/AgenticSystemCreateResponse" />'
- name: AgenticSystemExecuteRequest
  description: '<SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteRequest" />'
- name: AgenticSystemTurn
  description: |-
    A single turn in an interaction with an Agentic System.

    <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemTurn" />
- name: Attachment
  description: |-
    Attachments are used to refer to external resources, such as images, videos, audio, etc.

    <SchemaDefinition schemaRef="#/components/schemas/Attachment" />
- name: Message
  description: '<SchemaDefinition schemaRef="#/components/schemas/Message" />'
- name: URL
  description: '<SchemaDefinition schemaRef="#/components/schemas/URL" />'
- name: AgenticSystemExecuteResponse
  description: |-
    non-stream response from the agentic system.

    <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteResponse" />
- name: AgenticSystemExecuteResponseStreamChunk
  description: |-
    Streamed agent execution response.

    <SchemaDefinition schemaRef="#/components/schemas/AgenticSystemExecuteResponseStreamChunk" />
- name: ChatCompletionRequest
  description: '<SchemaDefinition schemaRef="#/components/schemas/ChatCompletionRequest" />'
- name: ChatCompletionResponse
  description: |-
    Normal chat completion response.

    <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponse" />
- name: ChatCompletionResponseStreamChunk
  description: |-
    Streamed chat completion response. The actual response is a series of such objects.

    <SchemaDefinition schemaRef="#/components/schemas/ChatCompletionResponseStreamChunk" />
- name: CompletionRequest
  description: '<SchemaDefinition schemaRef="#/components/schemas/CompletionRequest" />'
- name: CompletionResponse
  description: |-
    Normal completion response.

    <SchemaDefinition schemaRef="#/components/schemas/CompletionResponse" />
- name: CompletionResponseStreamChunk
  description: |-
    streamed completion response.

    <SchemaDefinition schemaRef="#/components/schemas/CompletionResponseStreamChunk" />
# Vendor extension (x- prefix) that sorts the tags declared under `tags`
# into two named groups: operation tags and per-schema type tags.
x-tagGroups:
# Tags attached to the path operations.
- name: Operations
  tags:
  - AgenticSystem
  - Inference
# One tag per entry in components.schemas.
- name: Types
  tags:
  - AgenticSystemCreateRequest
  - AgenticSystemCreateResponse
  - AgenticSystemExecuteRequest
  - AgenticSystemExecuteResponse
  - AgenticSystemExecuteResponseStreamChunk
  - AgenticSystemTurn
  - Attachment
  - ChatCompletionRequest
  - ChatCompletionResponse
  - ChatCompletionResponseStreamChunk
  - CompletionRequest
  - CompletionResponse
  - CompletionResponseStreamChunk
  - Message
  - URL