Flatten enums

2025-08-07 02:58:21 +00:00 · 2025-01-29 09:09:51 -08:00 · 2025-01-29 09:09:51 -08:00 · 3e2a751f54
commit 3e2a751f54
parent 62c3c5bb7e
5 changed files with 243 additions and 259 deletions
--- a/docs/resources/llama-stack-spec.html
+++ b/docs/resources/llama-stack-spec.html
@ -2337,15 +2337,6 @@
                    "rows"
                ]
            },
            "BuiltinTool": {
                "type": "string",
                "enum": [
                    "brave_search",
                    "wolfram_alpha",
                    "photogen",
                    "code_interpreter"
                ]
            },
            "CompletionMessage": {
                "type": "object",
                "properties": {
@ -2360,7 +2351,12 @@
                        "description": "The content of the model's response"
                    },
                    "stop_reason": {
-                        "$ref": "#/components/schemas/StopReason",
+                        "type": "string",
                        "enum": [
                            "end_of_turn",
                            "end_of_message",
                            "out_of_tokens"
                        ],
                        "description": "Reason why the model stopped generating. Options are: - `StopReason.end_of_turn`: The model finished generating the entire response. - `StopReason.end_of_message`: The model finished generating but generated a partial response -- usually, a tool call. The user may call the tool and continue the conversation with the tool's response. - `StopReason.out_of_tokens`: The model ran out of token budget."
                    },
                    "tool_calls": {
@ -2587,25 +2583,7 @@
                "type": "object",
                "properties": {
                    "strategy": {
-                        "oneOf": [
+                        "$ref": "#/components/schemas/SamplingStrategy"
                            {
                                "$ref": "#/components/schemas/GreedySamplingStrategy"
                            },
                            {
                                "$ref": "#/components/schemas/TopPSamplingStrategy"
                            },
                            {
                                "$ref": "#/components/schemas/TopKSamplingStrategy"
                            }
                        ],
                        "discriminator": {
                            "propertyName": "type",
                            "mapping": {
                                "greedy": "#/components/schemas/GreedySamplingStrategy",
                                "top_p": "#/components/schemas/TopPSamplingStrategy",
                                "top_k": "#/components/schemas/TopKSamplingStrategy"
                            }
                        }
                    },
                    "max_tokens": {
                        "type": "integer",
@ -2621,13 +2599,26 @@
                    "strategy"
                ]
            },
-            "StopReason": {
+            "SamplingStrategy": {
-                "type": "string",
+                "oneOf": [
-                "enum": [
+                    {
-                    "end_of_turn",
+                        "$ref": "#/components/schemas/GreedySamplingStrategy"
-                    "end_of_message",
+                    },
-                    "out_of_tokens"
+                    {
-                ]
+                        "$ref": "#/components/schemas/TopPSamplingStrategy"
                    },
                    {
                        "$ref": "#/components/schemas/TopKSamplingStrategy"
                    }
                ],
                "discriminator": {
                    "propertyName": "type",
                    "mapping": {
                        "greedy": "#/components/schemas/GreedySamplingStrategy",
                        "top_p": "#/components/schemas/TopPSamplingStrategy",
                        "top_k": "#/components/schemas/TopKSamplingStrategy"
                    }
                }
            },
            "SystemMessage": {
                "type": "object",
@ -2677,7 +2668,13 @@
                    "tool_name": {
                        "oneOf": [
                            {
-                                "$ref": "#/components/schemas/BuiltinTool"
+                                "type": "string",
                                "enum": [
                                    "brave_search",
                                    "wolfram_alpha",
                                    "photogen",
                                    "code_interpreter"
                                ]
                            },
                            {
                                "type": "string"
@ -2758,21 +2755,19 @@
                    "arguments"
                ]
            },
            "ToolChoice": {
                "type": "string",
                "enum": [
                    "auto",
                    "required"
                ],
                "title": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model."
            },
            "ToolDefinition": {
                "type": "object",
                "properties": {
                    "tool_name": {
                        "oneOf": [
                            {
-                                "$ref": "#/components/schemas/BuiltinTool"
+                                "type": "string",
                                "enum": [
                                    "brave_search",
                                    "wolfram_alpha",
                                    "photogen",
                                    "code_interpreter"
                                ]
                            },
                            {
                                "type": "string"
@ -2835,16 +2830,6 @@
                    "param_type"
                ]
            },
            "ToolPromptFormat": {
                "type": "string",
                "enum": [
                    "json",
                    "function_tag",
                    "python_list"
                ],
                "title": "This Enum refers to the prompt format for calling custom / zero shot tools",
                "description": "`json` --\n    Refers to the json format for calling tools.\n    The json format takes the form like\n    {\n        \"type\": \"function\",\n        \"function\" : {\n            \"name\": \"function_name\",\n            \"description\": \"function_description\",\n            \"parameters\": {...}\n        }\n    }\n\n`function_tag` --\n    This is an example of how you could define\n    your own user defined format for making tool calls.\n    The function_tag format looks like this,\n    <function=function_name>(parameters)</function>\n\nThe detailed prompts for each of these formats are added to llama cli"
            },
            "ToolResponseMessage": {
                "type": "object",
                "properties": {
@ -2861,7 +2846,13 @@
                    "tool_name": {
                        "oneOf": [
                            {
-                                "$ref": "#/components/schemas/BuiltinTool"
+                                "type": "string",
                                "enum": [
                                    "brave_search",
                                    "wolfram_alpha",
                                    "photogen",
                                    "code_interpreter"
                                ]
                            },
                            {
                                "type": "string"
@ -2984,10 +2975,22 @@
                        }
                    },
                    "tool_choice": {
-                        "$ref": "#/components/schemas/ToolChoice"
+                        "type": "string",
                        "enum": [
                            "auto",
                            "required"
                        ],
                        "title": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model."
                    },
                    "tool_prompt_format": {
-                        "$ref": "#/components/schemas/ToolPromptFormat"
+                        "type": "string",
                        "enum": [
                            "json",
                            "function_tag",
                            "python_list"
                        ],
                        "title": "This Enum refers to the prompt format for calling custom / zero shot tools",
                        "description": "The detailed prompts for each of these formats are added to llama cli"
                    },
                    "response_format": {
                        "$ref": "#/components/schemas/ResponseFormat"
@ -3122,7 +3125,12 @@
                        "description": "The generated completion text"
                    },
                    "stop_reason": {
-                        "$ref": "#/components/schemas/StopReason",
+                        "type": "string",
                        "enum": [
                            "end_of_turn",
                            "end_of_message",
                            "out_of_tokens"
                        ],
                        "description": "Reason why generation stopped"
                    },
                    "logprobs": {
@ -3178,11 +3186,20 @@
                        "description": "(Optional) List of tool definitions available to the model"
                    },
                    "tool_choice": {
-                        "$ref": "#/components/schemas/ToolChoice",
+                        "type": "string",
                        "enum": [
                            "auto",
                            "required"
                        ],
                        "description": "(Optional) Whether tool use is required or automatic. Defaults to ToolChoice.auto."
                    },
                    "tool_prompt_format": {
-                        "$ref": "#/components/schemas/ToolPromptFormat",
+                        "type": "string",
                        "enum": [
                            "json",
                            "function_tag",
                            "python_list"
                        ],
                        "description": "(Optional) Instructs the model how to format tool calls. By default, Llama Stack will attempt to use a format that is best adapted to the model. - `ToolPromptFormat.json`: The tool calls are formatted as a JSON object. - `ToolPromptFormat.function_tag`: The tool calls are enclosed in a <function=function_name> tag. - `ToolPromptFormat.python_list`: The tool calls are output as Python syntax -- a list of function calls."
                    },
                    "response_format": {
@ -3216,7 +3233,12 @@
                "type": "object",
                "properties": {
                    "event_type": {
-                        "$ref": "#/components/schemas/ChatCompletionResponseEventType",
+                        "type": "string",
                        "enum": [
                            "start",
                            "complete",
                            "progress"
                        ],
                        "description": "Type of the event"
                    },
                    "delta": {
@ -3231,7 +3253,12 @@
                        "description": "Optional log probabilities for generated tokens"
                    },
                    "stop_reason": {
-                        "$ref": "#/components/schemas/StopReason",
+                        "type": "string",
                        "enum": [
                            "end_of_turn",
                            "end_of_message",
                            "out_of_tokens"
                        ],
                        "description": "Optional reason why generation stopped, if complete"
                    }
                },
@ -3242,15 +3269,6 @@
                ],
                "title": "An event during chat completion generation."
            },
            "ChatCompletionResponseEventType": {
                "type": "string",
                "enum": [
                    "start",
                    "complete",
                    "progress"
                ],
                "title": "Types of events that can occur during chat completion."
            },
            "ChatCompletionResponseStreamChunk": {
                "type": "object",
                "properties": {
@ -3342,7 +3360,13 @@
                        ]
                    },
                    "parse_status": {
-                        "$ref": "#/components/schemas/ToolCallParseStatus"
+                        "type": "string",
                        "enum": [
                            "started",
                            "in_progress",
                            "failed",
                            "succeeded"
                        ]
                    }
                },
                "additionalProperties": false,
@ -3352,15 +3376,6 @@
                    "parse_status"
                ]
            },
            "ToolCallParseStatus": {
                "type": "string",
                "enum": [
                    "started",
                    "in_progress",
                    "failed",
                    "succeeded"
                ]
            },
            "CompletionRequest": {
                "type": "object",
                "properties": {
@ -3411,7 +3426,12 @@
                        "description": "New content generated since last chunk. This can be one or more tokens."
                    },
                    "stop_reason": {
-                        "$ref": "#/components/schemas/StopReason",
+                        "type": "string",
                        "enum": [
                            "end_of_turn",
                            "end_of_message",
                            "out_of_tokens"
                        ],
                        "description": "Optional reason why generation stopped, if complete"
                    },
                    "logprobs": {
@ -3459,11 +3479,23 @@
                        }
                    },
                    "tool_choice": {
-                        "$ref": "#/components/schemas/ToolChoice",
+                        "type": "string",
                        "enum": [
                            "auto",
                            "required"
                        ],
                        "title": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model.",
                        "default": "auto"
                    },
                    "tool_prompt_format": {
-                        "$ref": "#/components/schemas/ToolPromptFormat"
+                        "type": "string",
                        "enum": [
                            "json",
                            "function_tag",
                            "python_list"
                        ],
                        "title": "This Enum refers to the prompt format for calling custom / zero shot tools",
                        "description": "The detailed prompts for each of these formats are added to llama cli"
                    },
                    "max_infer_iters": {
                        "type": "integer",
@ -4170,7 +4202,13 @@
                    "tool_name": {
                        "oneOf": [
                            {
-                                "$ref": "#/components/schemas/BuiltinTool"
+                                "type": "string",
                                "enum": [
                                    "brave_search",
                                    "wolfram_alpha",
                                    "photogen",
                                    "code_interpreter"
                                ]
                            },
                            {
                                "type": "string"
@ -7917,10 +7955,6 @@
            "name": "BooleanType",
            "description": ""
        },
        {
            "name": "BuiltinTool",
            "description": ""
        },
        {
            "name": "CancelTrainingJobRequest",
            "description": ""
@ -7941,10 +7975,6 @@
            "name": "ChatCompletionResponseEvent",
            "description": "An event during chat completion generation."
        },
        {
            "name": "ChatCompletionResponseEventType",
            "description": "Types of events that can occur during chat completion."
        },
        {
            "name": "ChatCompletionResponseStreamChunk",
            "description": "A chunk of a streamed chat completion response."
@ -8376,6 +8406,10 @@
            "name": "SamplingParams",
            "description": ""
        },
        {
            "name": "SamplingStrategy",
            "description": ""
        },
        {
            "name": "SaveSpansToDatasetRequest",
            "description": ""
@ -8449,10 +8483,6 @@
            "name": "SpanWithStatus",
            "description": ""
        },
        {
            "name": "StopReason",
            "description": ""
        },
        {
            "name": "StringType",
            "description": ""
@ -8511,14 +8541,6 @@
            "name": "ToolCallDelta",
            "description": ""
        },
        {
            "name": "ToolCallParseStatus",
            "description": ""
        },
        {
            "name": "ToolChoice",
            "description": "Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model."
        },
        {
            "name": "ToolDef",
            "description": ""
@ -8554,10 +8576,6 @@
            "name": "ToolParameter",
            "description": ""
        },
        {
            "name": "ToolPromptFormat",
            "description": "This Enum refers to the prompt format for calling custom / zero shot tools\n\n`json` --\n    Refers to the json format for calling tools.\n    The json format takes the form like\n    {\n        \"type\": \"function\",\n        \"function\" : {\n            \"name\": \"function_name\",\n            \"description\": \"function_description\",\n            \"parameters\": {...}\n        }\n    }\n\n`function_tag` --\n    This is an example of how you could define\n    your own user defined format for making tool calls.\n    The function_tag format looks like this,\n    <function=function_name>(parameters)</function>\n\nThe detailed prompts for each of these formats are added to llama cli"
        },
        {
            "name": "ToolResponse",
            "description": ""
@ -8680,13 +8698,11 @@
                "BatchCompletionResponse",
                "BenchmarkEvalTaskConfig",
                "BooleanType",
                "BuiltinTool",
                "CancelTrainingJobRequest",
                "ChatCompletionInputType",
                "ChatCompletionRequest",
                "ChatCompletionResponse",
                "ChatCompletionResponseEvent",
                "ChatCompletionResponseEventType",
                "ChatCompletionResponseStreamChunk",
                "Checkpoint",
                "CompletionInputType",
@ -8788,6 +8804,7 @@
                "RunShieldResponse",
                "SafetyViolation",
                "SamplingParams",
                "SamplingStrategy",
                "SaveSpansToDatasetRequest",
                "ScoreBatchRequest",
                "ScoreBatchResponse",
@ -8804,7 +8821,6 @@
                "SpanStartPayload",
                "SpanStatus",
                "SpanWithStatus",
                "StopReason",
                "StringType",
                "StructuredLogEvent",
                "StructuredLogPayload",
@ -8818,8 +8834,6 @@
                "Tool",
                "ToolCall",
                "ToolCallDelta",
                "ToolCallParseStatus",
                "ToolChoice",
                "ToolDef",
                "ToolDefinition",
                "ToolExecutionStep",
@ -8828,7 +8842,6 @@
                "ToolInvocationResult",
                "ToolParamDefinition",
                "ToolParameter",
                "ToolPromptFormat",
                "ToolResponse",
                "ToolResponseMessage",
                "TopKSamplingStrategy",
--- a/docs/resources/llama-stack-spec.yaml
+++ b/docs/resources/llama-stack-spec.yaml
@ -1383,13 +1383,6 @@ components:
      required:
        - dataset_id
        - rows
    BuiltinTool:
      type: string
      enum:
        - brave_search
        - wolfram_alpha
        - photogen
        - code_interpreter
    CompletionMessage:
      type: object
      properties:
@ -1403,7 +1396,11 @@ components:
          $ref: '#/components/schemas/InterleavedContent'
          description: The content of the model's response
        stop_reason:
-          $ref: '#/components/schemas/StopReason'
+          type: string
          enum:
            - end_of_turn
            - end_of_message
            - out_of_tokens
          description: >-
            Reason why the model stopped generating. Options are: - `StopReason.end_of_turn`:
            The model finished generating the entire response. - `StopReason.end_of_message`:
@ -1552,16 +1549,7 @@ components:
      type: object
      properties:
        strategy:
-          oneOf:
+          $ref: '#/components/schemas/SamplingStrategy'
            - $ref: '#/components/schemas/GreedySamplingStrategy'
            - $ref: '#/components/schemas/TopPSamplingStrategy'
            - $ref: '#/components/schemas/TopKSamplingStrategy'
          discriminator:
            propertyName: type
            mapping:
              greedy: '#/components/schemas/GreedySamplingStrategy'
              top_p: '#/components/schemas/TopPSamplingStrategy'
              top_k: '#/components/schemas/TopKSamplingStrategy'
        max_tokens:
          type: integer
          default: 0
@ -1571,12 +1559,17 @@ components:
      additionalProperties: false
      required:
        - strategy
-    StopReason:
+    SamplingStrategy:
-      type: string
+      oneOf:
-      enum:
+        - $ref: '#/components/schemas/GreedySamplingStrategy'
-        - end_of_turn
+        - $ref: '#/components/schemas/TopPSamplingStrategy'
-        - end_of_message
+        - $ref: '#/components/schemas/TopKSamplingStrategy'
-        - out_of_tokens
+      discriminator:
        propertyName: type
        mapping:
          greedy: '#/components/schemas/GreedySamplingStrategy'
          top_p: '#/components/schemas/TopPSamplingStrategy'
          top_k: '#/components/schemas/TopKSamplingStrategy'
    SystemMessage:
      type: object
      properties:
@ -1618,7 +1611,12 @@ components:
          type: string
        tool_name:
          oneOf:
-            - $ref: '#/components/schemas/BuiltinTool'
+            - type: string
              enum:
                - brave_search
                - wolfram_alpha
                - photogen
                - code_interpreter
            - type: string
        arguments:
          type: object
@ -1650,21 +1648,17 @@ components:
        - call_id
        - tool_name
        - arguments
    ToolChoice:
      type: string
      enum:
        - auto
        - required
      title: >-
        Whether tool use is required or automatic. This is a hint to the model which
        may not be followed. It depends on the Instruction Following capabilities
        of the model.
    ToolDefinition:
      type: object
      properties:
        tool_name:
          oneOf:
-            - $ref: '#/components/schemas/BuiltinTool'
+            - type: string
              enum:
                - brave_search
                - wolfram_alpha
                - photogen
                - code_interpreter
            - type: string
        description:
          type: string
@ -1696,34 +1690,6 @@ components:
      additionalProperties: false
      required:
        - param_type
    ToolPromptFormat:
      type: string
      enum:
        - json
        - function_tag
        - python_list
      title: >-
        This Enum refers to the prompt format for calling custom / zero shot tools
      description: >-
        `json` --
            Refers to the json format for calling tools.
            The json format takes the form like
            {
                "type": "function",
                "function" : {
                    "name": "function_name",
                    "description": "function_description",
                    "parameters": {...}
                }
            }
        `function_tag` --
            This is an example of how you could define
            your own user defined format for making tool calls.
            The function_tag format looks like this,
            <function=function_name>(parameters)</function>
        The detailed prompts for each of these formats are added to llama cli
    ToolResponseMessage:
      type: object
      properties:
@ -1739,7 +1705,12 @@ components:
            Unique identifier for the tool call this response is for
        tool_name:
          oneOf:
-            - $ref: '#/components/schemas/BuiltinTool'
+            - type: string
              enum:
                - brave_search
                - wolfram_alpha
                - photogen
                - code_interpreter
            - type: string
          description: Name of the tool that was called
        content:
@ -1831,9 +1802,24 @@ components:
          items:
            $ref: '#/components/schemas/ToolDefinition'
        tool_choice:
-          $ref: '#/components/schemas/ToolChoice'
+          type: string
          enum:
            - auto
            - required
          title: >-
            Whether tool use is required or automatic. This is a hint to the model
            which may not be followed. It depends on the Instruction Following capabilities
            of the model.
        tool_prompt_format:
-          $ref: '#/components/schemas/ToolPromptFormat'
+          type: string
          enum:
            - json
            - function_tag
            - python_list
          title: >-
            This Enum refers to the prompt format for calling custom / zero shot tools
          description: >-
            The detailed prompts for each of these formats are added to llama cli
        response_format:
          $ref: '#/components/schemas/ResponseFormat'
        logprobs:
@ -1931,7 +1917,11 @@ components:
          type: string
          description: The generated completion text
        stop_reason:
-          $ref: '#/components/schemas/StopReason'
+          type: string
          enum:
            - end_of_turn
            - end_of_message
            - out_of_tokens
          description: Reason why generation stopped
        logprobs:
          type: array
@ -1976,11 +1966,18 @@ components:
          description: >-
            (Optional) List of tool definitions available to the model
        tool_choice:
-          $ref: '#/components/schemas/ToolChoice'
+          type: string
          enum:
            - auto
            - required
          description: >-
            (Optional) Whether tool use is required or automatic. Defaults to ToolChoice.auto.
        tool_prompt_format:
-          $ref: '#/components/schemas/ToolPromptFormat'
+          type: string
          enum:
            - json
            - function_tag
            - python_list
          description: >-
            (Optional) Instructs the model how to format tool calls. By default, Llama
            Stack will attempt to use a format that is best adapted to the model.
@ -2021,7 +2018,11 @@ components:
      type: object
      properties:
        event_type:
-          $ref: '#/components/schemas/ChatCompletionResponseEventType'
+          type: string
          enum:
            - start
            - complete
            - progress
          description: Type of the event
        delta:
          $ref: '#/components/schemas/ContentDelta'
@ -2035,7 +2036,11 @@ components:
          description: >-
            Optional log probabilities for generated tokens
        stop_reason:
-          $ref: '#/components/schemas/StopReason'
+          type: string
          enum:
            - end_of_turn
            - end_of_message
            - out_of_tokens
          description: >-
            Optional reason why generation stopped, if complete
      additionalProperties: false
@ -2044,14 +2049,6 @@ components:
        - delta
      title: >-
        An event during chat completion generation.
    ChatCompletionResponseEventType:
      type: string
      enum:
        - start
        - complete
        - progress
      title: >-
        Types of events that can occur during chat completion.
    ChatCompletionResponseStreamChunk:
      type: object
      properties:
@ -2113,19 +2110,17 @@ components:
            - type: string
            - $ref: '#/components/schemas/ToolCall'
        parse_status:
-          $ref: '#/components/schemas/ToolCallParseStatus'
+          type: string
          enum:
            - started
            - in_progress
            - failed
            - succeeded
      additionalProperties: false
      required:
        - type
        - tool_call
        - parse_status
    ToolCallParseStatus:
      type: string
      enum:
        - started
        - in_progress
        - failed
        - succeeded
    CompletionRequest:
      type: object
      properties:
@ -2174,7 +2169,11 @@ components:
          description: >-
            New content generated since last chunk. This can be one or more tokens.
        stop_reason:
-          $ref: '#/components/schemas/StopReason'
+          type: string
          enum:
            - end_of_turn
            - end_of_message
            - out_of_tokens
          description: >-
            Optional reason why generation stopped, if complete
        logprobs:
@ -2210,10 +2209,25 @@ components:
          items:
            $ref: '#/components/schemas/ToolDef'
        tool_choice:
-          $ref: '#/components/schemas/ToolChoice'
+          type: string
          enum:
            - auto
            - required
          title: >-
            Whether tool use is required or automatic. This is a hint to the model
            which may not be followed. It depends on the Instruction Following capabilities
            of the model.
          default: auto
        tool_prompt_format:
-          $ref: '#/components/schemas/ToolPromptFormat'
+          type: string
          enum:
            - json
            - function_tag
            - python_list
          title: >-
            This Enum refers to the prompt format for calling custom / zero shot tools
          description: >-
            The detailed prompts for each of these formats are added to llama cli
        max_infer_iters:
          type: integer
          default: 10
@ -2656,7 +2670,12 @@ components:
          type: string
        tool_name:
          oneOf:
-            - $ref: '#/components/schemas/BuiltinTool'
+            - type: string
              enum:
                - brave_search
                - wolfram_alpha
                - photogen
                - code_interpreter
            - type: string
        content:
          $ref: '#/components/schemas/InterleavedContent'
@ -4942,8 +4961,6 @@ tags:
    description: ''
  - name: BooleanType
    description: ''
  - name: BuiltinTool
    description: ''
  - name: CancelTrainingJobRequest
    description: ''
  - name: ChatCompletionInputType
@ -4955,9 +4972,6 @@ tags:
  - name: ChatCompletionResponseEvent
    description: >-
      An event during chat completion generation.
  - name: ChatCompletionResponseEventType
    description: >-
      Types of events that can occur during chat completion.
  - name: ChatCompletionResponseStreamChunk
    description: >-
      A chunk of a streamed chat completion response.
@ -5175,6 +5189,8 @@ tags:
    description: ''
  - name: SamplingParams
    description: ''
  - name: SamplingStrategy
    description: ''
  - name: SaveSpansToDatasetRequest
    description: ''
  - name: ScoreBatchRequest
@ -5212,8 +5228,6 @@ tags:
    description: ''
  - name: SpanWithStatus
    description: ''
  - name: StopReason
    description: ''
  - name: StringType
    description: ''
  - name: StructuredLogEvent
@ -5245,13 +5259,6 @@ tags:
    description: ''
  - name: ToolCallDelta
    description: ''
  - name: ToolCallParseStatus
    description: ''
  - name: ToolChoice
    description: >-
      Whether tool use is required or automatic. This is a hint to the model which
      may not be followed. It depends on the Instruction Following capabilities of
      the model.
  - name: ToolDef
    description: ''
  - name: ToolDefinition
@ -5269,30 +5276,6 @@ tags:
    description: ''
  - name: ToolParameter
    description: ''
  - name: ToolPromptFormat
    description: >-
      This Enum refers to the prompt format for calling custom / zero shot tools
      `json` --
          Refers to the json format for calling tools.
          The json format takes the form like
          {
              "type": "function",
              "function" : {
                  "name": "function_name",
                  "description": "function_description",
                  "parameters": {...}
              }
          }
      `function_tag` --
          This is an example of how you could define
          your own user defined format for making tool calls.
          The function_tag format looks like this,
          <function=function_name>(parameters)</function>
      The detailed prompts for each of these formats are added to llama cli
  - name: ToolResponse
    description: ''
  - name: ToolResponseMessage
@ -5379,13 +5362,11 @@ x-tagGroups:
      - BatchCompletionResponse
      - BenchmarkEvalTaskConfig
      - BooleanType
      - BuiltinTool
      - CancelTrainingJobRequest
      - ChatCompletionInputType
      - ChatCompletionRequest
      - ChatCompletionResponse
      - ChatCompletionResponseEvent
      - ChatCompletionResponseEventType
      - ChatCompletionResponseStreamChunk
      - Checkpoint
      - CompletionInputType
@ -5487,6 +5468,7 @@ x-tagGroups:
      - RunShieldResponse
      - SafetyViolation
      - SamplingParams
      - SamplingStrategy
      - SaveSpansToDatasetRequest
      - ScoreBatchRequest
      - ScoreBatchResponse
@ -5503,7 +5485,6 @@ x-tagGroups:
      - SpanStartPayload
      - SpanStatus
      - SpanWithStatus
      - StopReason
      - StringType
      - StructuredLogEvent
      - StructuredLogPayload
@ -5517,8 +5498,6 @@ x-tagGroups:
      - Tool
      - ToolCall
      - ToolCallDelta
      - ToolCallParseStatus
      - ToolChoice
      - ToolDef
      - ToolDefinition
      - ToolExecutionStep
@ -5527,7 +5506,6 @@ x-tagGroups:
      - ToolInvocationResult
      - ToolParamDefinition
      - ToolParameter
      - ToolPromptFormat
      - ToolResponse
      - ToolResponseMessage
      - TopKSamplingStrategy
--- a/llama_stack/apis/common/content_types.py
+++ b/llama_stack/apis/common/content_types.py
@ -77,7 +77,6 @@ class ImageDelta(BaseModel):
    image: bytes
@json_schema_type
 class ToolCallParseStatus(Enum):
    started = "started"
    in_progress = "in_progress"
--- a/llama_stack/apis/inference/inference.py
+++ b/llama_stack/apis/inference/inference.py
@ -43,7 +43,6 @@ class LogProbConfig(BaseModel):
    top_k: Optional[int] = 0
@json_schema_type
 class QuantizationType(Enum):
    """Type of model quantization to run inference with.
@ -177,7 +176,6 @@ class ToolResponse(BaseModel):
        return v
@json_schema_type
 class ToolChoice(Enum):
    """Whether tool use is required or automatic. This is a hint to the model which may not be followed. It depends on the Instruction Following capabilities of the model.
@ -199,7 +197,6 @@ class TokenLogProbs(BaseModel):
    logprobs_by_token: Dict[str, float]
@json_schema_type
 class ChatCompletionResponseEventType(Enum):
    """Types of events that can occur during chat completion.
@ -229,7 +226,6 @@ class ChatCompletionResponseEvent(BaseModel):
    stop_reason: Optional[StopReason] = None
@json_schema_type
 class ResponseFormatType(Enum):
    """Types of formats for structured (guided) decoding.
--- a/llama_stack/apis/resource.py
+++ b/llama_stack/apis/resource.py
@ -6,11 +6,9 @@
 from enum import Enum
 from llama_models.schema_utils import json_schema_type
 from pydantic import BaseModel, Field
@json_schema_type
 class ResourceType(Enum):
    model = "model"
    shield = "shield"