From 75ac0b2db1101484463f5148ab3759d41b505fb5 Mon Sep 17 00:00:00 2001 From: Xi Yan Date: Wed, 11 Sep 2024 14:17:57 -0700 Subject: [PATCH] re-generate openapi spec --- .../llama-stack-spec.html | 1112 ++++------------- .../llama-stack-spec.yaml | 802 +++--------- 2 files changed, 423 insertions(+), 1491 deletions(-) diff --git a/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.html b/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.html index abd0612e7..e611b2bc3 100644 --- a/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.html +++ b/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.html @@ -21,7 +21,7 @@ "info": { "title": "[DRAFT] Llama Stack Specification", "version": "0.0.1", - "description": "This is the specification of the llama stack that provides\n a set of endpoints and their corresponding interfaces that are tailored to\n best leverage Llama Models. The specification is still in draft and subject to change.\n Generated at 2024-09-11 12:34:17.939867" + "description": "This is the specification of the llama stack that provides\n a set of endpoints and their corresponding interfaces that are tailored to\n best leverage Llama Models. The specification is still in draft and subject to change.\n Generated at 2024-09-11 14:17:44.361462" }, "servers": [ { @@ -51,7 +51,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/BatchChatCompletionRequestWrapper" + "$ref": "#/components/schemas/BatchChatCompletionRequest" } } }, @@ -81,7 +81,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/BatchCompletionRequestWrapper" + "$ref": "#/components/schemas/BatchCompletionRequest" } } }, @@ -277,7 +277,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/AgenticSystemTurnCreateRequestWrapper" + "$ref": "#/components/schemas/CreateAgenticSystemTurnRequest" } } }, @@ -300,7 +300,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/CreateDatasetRequestWrapper" + "$ref": "#/components/schemas/CreateDatasetRequest" } } }, @@ -330,7 +330,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/CreateExperimentRequestWrapper" + "$ref": "#/components/schemas/CreateExperimentRequest" } } }, @@ -390,7 +390,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/CreateRunRequestWrapper" + "$ref": "#/components/schemas/CreateRunRequest" } } }, @@ -572,7 +572,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/EvaluateQuestionAnsweringRequestWrapper" + "$ref": "#/components/schemas/EvaluateQuestionAnsweringRequest" } } }, @@ -602,7 +602,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/EvaluateSummarizationRequestWrapper" + "$ref": "#/components/schemas/EvaluateSummarizationRequest" } } }, @@ -632,7 +632,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/EvaluateTextGenerationRequestWrapper" + "$ref": "#/components/schemas/EvaluateTextGenerationRequest" } } }, @@ -1019,12 +1019,21 @@ "tags": [ "Telemetry" ], - "parameters": [], + "parameters": [ + { + "name": "query", + "in": "query", + "required": true, + "schema": { + "type": "string" + } + } + ], "requestBody": { "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/LogSearchRequestWrapper" + "$ref": "#/components/schemas/GetLogsRequest" } } }, @@ -1312,7 +1321,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/LogMessagesRequestWrapper" + "$ref": "#/components/schemas/LogMessagesRequest" } } }, @@ -1335,7 +1344,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/LogMetricsRequestWrapper" + "$ref": "#/components/schemas/LogMetricsRequest" } } }, @@ -1365,7 +1374,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/PostTrainingRLHFRequestWrapper" + "$ref": "#/components/schemas/PreferenceOptimizeRequest" } } }, @@ -1425,7 +1434,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/RewardScoringRequestWrapper" + "$ref": "#/components/schemas/RewardScoreRequest" } } }, @@ -1455,7 +1464,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/RunShieldRequestWrapper" + "$ref": "#/components/schemas/RunShieldsRequest" } } }, @@ -1485,7 +1494,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/PostTrainingSFTRequestWrapper" + "$ref": "#/components/schemas/SupervisedFineTuneRequest" } } }, @@ -1515,7 +1524,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/SyntheticDataGenerationRequestWrapper" + "$ref": "#/components/schemas/SyntheticDataGenerateRequest" } } }, @@ -1568,7 +1577,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/UpdateExperimentRequestWrapper" + "$ref": "#/components/schemas/UpdateExperimentRequest" } } }, @@ -1598,7 +1607,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/UpdateRunRequestWrapper" + "$ref": "#/components/schemas/UpdateRunRequest" } } }, @@ -1628,7 +1637,7 @@ "content": { "application/json": { "schema": { - "$ref": "#/components/schemas/UploadArtifactRequestWrapper" + "$ref": "#/components/schemas/UploadArtifactRequest" } } }, @@ -1640,65 +1649,6 @@ "jsonSchemaDialect": "https://json-schema.org/draft/2020-12/schema", "components": { "schemas": { - "BatchChatCompletionRequest": { - "type": "object", - "properties": { - "model": { - "type": "string" - }, - "messages_batch": { - "type": "array", - "items": { - "type": "array", - "items": { - "oneOf": [ - { - "$ref": "#/components/schemas/UserMessage" - }, - { - "$ref": "#/components/schemas/SystemMessage" - }, - { - "$ref": "#/components/schemas/ToolResponseMessage" - }, - { - "$ref": "#/components/schemas/CompletionMessage" - } - ] - } - } - }, - "sampling_params": { - "$ref": "#/components/schemas/SamplingParams" - }, - "tools": { - "type": "array", - "items": { - "$ref": "#/components/schemas/ToolDefinition" - } - }, - "tool_choice": { - "$ref": "#/components/schemas/ToolChoice" - }, - "tool_prompt_format": { - "$ref": "#/components/schemas/ToolPromptFormat" - }, - "logprobs": { - "type": "object", - "properties": { - "top_k": { - "type": "integer" - } - }, - "additionalProperties": false - } - }, - "additionalProperties": false, - "required": [ - "model", - "messages_batch" - ] - }, "BuiltinTool": { "type": "string", "enum": [ @@ -2050,16 +2000,63 @@ "content" ] }, - "BatchChatCompletionRequestWrapper": { + "BatchChatCompletionRequest": { "type": "object", "properties": { - "request": { - "$ref": "#/components/schemas/BatchChatCompletionRequest" + "model": { + "type": "string" + }, + "messages_batch": { + "type": "array", + "items": { + "type": "array", + "items": { + "oneOf": [ + { + "$ref": "#/components/schemas/UserMessage" + }, + { + "$ref": "#/components/schemas/SystemMessage" + }, + { + "$ref": "#/components/schemas/ToolResponseMessage" + }, + { + "$ref": "#/components/schemas/CompletionMessage" + } + ] + } + } + }, + "sampling_params": { + "$ref": "#/components/schemas/SamplingParams" + }, + "tools": { + "type": "array", + "items": { + "$ref": "#/components/schemas/ToolDefinition" + } + }, + "tool_choice": { + "$ref": "#/components/schemas/ToolChoice" + }, + "tool_prompt_format": { + "$ref": "#/components/schemas/ToolPromptFormat" + }, + "logprobs": { + "type": "object", + "properties": { + "top_k": { + "type": "integer" + } + }, + "additionalProperties": false } }, "additionalProperties": false, "required": [ - "request" + "model", + "messages_batch" ] }, "BatchChatCompletionResponse": { @@ -2118,18 +2115,6 @@ "content_batch" ] }, - "BatchCompletionRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/BatchCompletionRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "BatchCompletionResponse": { "type": "object", "properties": { @@ -3007,234 +2992,38 @@ "session_id" ] }, - "AgenticSystemTurnCreateRequest": { + "Attachment": { "type": "object", "properties": { - "sampling_params": { - "$ref": "#/components/schemas/SamplingParams" - }, - "input_shields": { - "type": "array", - "items": { - "$ref": "#/components/schemas/ShieldDefinition" - } - }, - "output_shields": { - "type": "array", - "items": { - "$ref": "#/components/schemas/ShieldDefinition" - } - }, - "tools": { - "type": "array", - "items": { - "oneOf": [ - { - "$ref": "#/components/schemas/SearchToolDefinition" - }, - { - "$ref": "#/components/schemas/WolframAlphaToolDefinition" - }, - { - "$ref": "#/components/schemas/PhotogenToolDefinition" - }, - { - "$ref": "#/components/schemas/CodeInterpreterToolDefinition" - }, - { - "$ref": "#/components/schemas/FunctionCallToolDefinition" - }, - { - "type": "object", - "properties": { - "input_shields": { - "type": "array", - "items": { - "$ref": "#/components/schemas/ShieldDefinition" - } - }, - "output_shields": { - "type": "array", - "items": { - "$ref": "#/components/schemas/ShieldDefinition" - } - }, - "type": { - "type": "string", - "const": "memory" - }, - "memory_bank_configs": { - "type": "array", - "items": { - "oneOf": [ - { - "type": "object", - "properties": { - "bank_id": { - "type": "string" - }, - "type": { - "type": "string", - "const": "vector" - } - }, - "additionalProperties": false, - "required": [ - "bank_id", - "type" - ] - }, - { - "type": "object", - "properties": { - "bank_id": { - "type": "string" - }, - "type": { - "type": "string", - "const": "keyvalue" - }, - "keys": { - "type": "array", - "items": { - "type": "string" - } - } - }, - "additionalProperties": false, - "required": [ - "bank_id", - "type", - "keys" - ] - }, - { - "type": "object", - "properties": { - "bank_id": { - "type": "string" - }, - "type": { - "type": "string", - "const": "keyword" - } - }, - "additionalProperties": false, - "required": [ - "bank_id", - "type" - ] - }, - { - "type": "object", - "properties": { - "bank_id": { - "type": "string" - }, - "type": { - "type": "string", - "const": "graph" - }, - "entities": { - "type": "array", - "items": { - "type": "string" - } - } - }, - "additionalProperties": false, - "required": [ - "bank_id", - "type", - "entities" - ] - } - ] - } - }, - "query_generator_config": { - "oneOf": [ - { - "type": "object", - "properties": { - "type": { - "type": "string", - "const": "default" - }, - "sep": { - "type": "string" - } - }, - "additionalProperties": false, - "required": [ - "type", - "sep" - ] - }, - { - "type": "object", - "properties": { - "type": { - "type": "string", - "const": "llm" - }, - "model": { - "type": "string" - }, - "template": { - "type": "string" - } - }, - "additionalProperties": false, - "required": [ - "type", - "model", - "template" - ] - }, - { - "type": "object", - "properties": { - "type": { - "type": "string", - "const": "custom" - } - }, - "additionalProperties": false, - "required": [ - "type" - ] - } - ] - }, - "max_tokens_in_context": { - "type": "integer" - }, - "max_chunks": { - "type": "integer" - } - }, - "additionalProperties": false, - "required": [ - "type", - "memory_bank_configs", - "query_generator_config", - "max_tokens_in_context", - "max_chunks" - ] + "content": { + "oneOf": [ + { + "type": "string" + }, + { + "type": "array", + "items": { + "type": "string" } - ] - } + }, + { + "$ref": "#/components/schemas/URL" + } + ] }, - "tool_choice": { - "$ref": "#/components/schemas/ToolChoice" - }, - "tool_prompt_format": { - "$ref": "#/components/schemas/ToolPromptFormat" - }, - "instructions": { + "mime_type": { "type": "string" - }, + } + }, + "additionalProperties": false, + "required": [ + "content", + "mime_type" + ] + }, + "CreateAgenticSystemTurnRequest": { + "type": "object", + "properties": { "agent_id": { "type": "string" }, @@ -3271,47 +3060,6 @@ "messages" ] }, - "Attachment": { - "type": "object", - "properties": { - "content": { - "oneOf": [ - { - "type": "string" - }, - { - "type": "array", - "items": { - "type": "string" - } - }, - { - "$ref": "#/components/schemas/URL" - } - ] - }, - "mime_type": { - "type": "string" - } - }, - "additionalProperties": false, - "required": [ - "content", - "mime_type" - ] - }, - "AgenticSystemTurnCreateRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/AgenticSystemTurnCreateRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "AgenticSystemTurnResponseEvent": { "type": "object", "properties": { @@ -3811,23 +3559,6 @@ ], "title": "A single turn in an interaction with an Agentic System." }, - "CreateDatasetRequest": { - "type": "object", - "properties": { - "uuid": { - "type": "string" - }, - "dataset": { - "$ref": "#/components/schemas/TrainEvalDataset" - } - }, - "additionalProperties": false, - "required": [ - "uuid", - "dataset" - ], - "title": "Request to create a dataset." - }, "TrainEvalDataset": { "type": "object", "properties": { @@ -3883,16 +3614,20 @@ "json" ] }, - "CreateDatasetRequestWrapper": { + "CreateDatasetRequest": { "type": "object", "properties": { - "request": { - "$ref": "#/components/schemas/CreateDatasetRequest" + "uuid": { + "type": "string" + }, + "dataset": { + "$ref": "#/components/schemas/TrainEvalDataset" } }, "additionalProperties": false, "required": [ - "request" + "uuid", + "dataset" ] }, "CreateExperimentRequest": { @@ -3932,18 +3667,6 @@ "name" ] }, - "CreateExperimentRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/CreateExperimentRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "Experiment": { "type": "object", "properties": { @@ -4216,18 +3939,6 @@ "experiment_id" ] }, - "CreateRunRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/CreateRunRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "Run": { "type": "object", "properties": { @@ -4401,24 +4112,9 @@ "embeddings" ] }, - "Checkpoint": { - "description": "Checkpoint created during training runs" - }, "EvaluateQuestionAnsweringRequest": { "type": "object", "properties": { - "job_uuid": { - "type": "string" - }, - "dataset": { - "$ref": "#/components/schemas/TrainEvalDataset" - }, - "checkpoint": { - "$ref": "#/components/schemas/Checkpoint" - }, - "sampling_params": { - "$ref": "#/components/schemas/SamplingParams" - }, "metrics": { "type": "array", "items": { @@ -4432,24 +4128,7 @@ }, "additionalProperties": false, "required": [ - "job_uuid", - "dataset", - "checkpoint", - "sampling_params", "metrics" - ], - "title": "Request to evaluate question answering." - }, - "EvaluateQuestionAnsweringRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/EvaluateQuestionAnsweringRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "EvaluationJob": { @@ -4467,18 +4146,6 @@ "EvaluateSummarizationRequest": { "type": "object", "properties": { - "job_uuid": { - "type": "string" - }, - "dataset": { - "$ref": "#/components/schemas/TrainEvalDataset" - }, - "checkpoint": { - "$ref": "#/components/schemas/Checkpoint" - }, - "sampling_params": { - "$ref": "#/components/schemas/SamplingParams" - }, "metrics": { "type": "array", "items": { @@ -4492,41 +4159,12 @@ }, "additionalProperties": false, "required": [ - "job_uuid", - "dataset", - "checkpoint", - "sampling_params", "metrics" - ], - "title": "Request to evaluate summarization." - }, - "EvaluateSummarizationRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/EvaluateSummarizationRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "EvaluateTextGenerationRequest": { "type": "object", "properties": { - "job_uuid": { - "type": "string" - }, - "dataset": { - "$ref": "#/components/schemas/TrainEvalDataset" - }, - "checkpoint": { - "$ref": "#/components/schemas/Checkpoint" - }, - "sampling_params": { - "$ref": "#/components/schemas/SamplingParams" - }, "metrics": { "type": "array", "items": { @@ -4541,24 +4179,7 @@ }, "additionalProperties": false, "required": [ - "job_uuid", - "dataset", - "checkpoint", - "sampling_params", "metrics" - ], - "title": "Request to evaluate text generation." - }, - "EvaluateTextGenerationRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/EvaluateTextGenerationRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "GetAgenticSystemSessionRequest": { @@ -4809,12 +4430,9 @@ "job_uuid" ] }, - "LogSearchRequest": { + "GetLogsRequest": { "type": "object", "properties": { - "query": { - "type": "string" - }, "filters": { "type": "object", "additionalProperties": { @@ -4841,22 +4459,7 @@ } } }, - "additionalProperties": false, - "required": [ - "query" - ] - }, - "LogSearchRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/LogSearchRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] + "additionalProperties": false }, "Log": { "type": "object", @@ -4943,6 +4546,9 @@ "run_id" ] }, + "Checkpoint": { + "description": "Checkpoint created during training runs" + }, "PostTrainingJobArtifactsResponse": { "type": "object", "properties": { @@ -5117,18 +4723,6 @@ "logs" ] }, - "LogMessagesRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/LogMessagesRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "LogMetricsRequest": { "type": "object", "properties": { @@ -5148,18 +4742,6 @@ "metrics" ] }, - "LogMetricsRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/LogMetricsRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "DPOAlignmentConfig": { "type": "object", "properties": { @@ -5213,7 +4795,49 @@ "weight_decay" ] }, - "PostTrainingRLHFRequest": { + "RLHFAlgorithm": { + "type": "string", + "enum": [ + "dpo" + ] + }, + "TrainingConfig": { + "type": "object", + "properties": { + "n_epochs": { + "type": "integer" + }, + "batch_size": { + "type": "integer" + }, + "shuffle": { + "type": "boolean" + }, + "n_iters": { + "type": "integer" + }, + "enable_activation_checkpointing": { + "type": "boolean" + }, + "memory_efficient_fsdp_wrap": { + "type": "boolean" + }, + "fsdp_cpu_offload": { + "type": "boolean" + } + }, + "additionalProperties": false, + "required": [ + "n_epochs", + "batch_size", + "shuffle", + "n_iters", + "enable_activation_checkpointing", + "memory_efficient_fsdp_wrap", + "fsdp_cpu_offload" + ] + }, + "PreferenceOptimizeRequest": { "type": "object", "properties": { "job_uuid": { @@ -5303,61 +4927,6 @@ "training_config", "hyperparam_search_config", "logger_config" - ], - "title": "Request to finetune a model." - }, - "RLHFAlgorithm": { - "type": "string", - "enum": [ - "dpo" - ] - }, - "TrainingConfig": { - "type": "object", - "properties": { - "n_epochs": { - "type": "integer" - }, - "batch_size": { - "type": "integer" - }, - "shuffle": { - "type": "boolean" - }, - "n_iters": { - "type": "integer" - }, - "enable_activation_checkpointing": { - "type": "boolean" - }, - "memory_efficient_fsdp_wrap": { - "type": "boolean" - }, - "fsdp_cpu_offload": { - "type": "boolean" - } - }, - "additionalProperties": false, - "required": [ - "n_epochs", - "batch_size", - "shuffle", - "n_iters", - "enable_activation_checkpointing", - "memory_efficient_fsdp_wrap", - "fsdp_cpu_offload" - ] - }, - "PostTrainingRLHFRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/PostTrainingRLHFRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "QueryDocumentsRequest": { @@ -5508,7 +5077,7 @@ "sampled_generations" ] }, - "RewardScoringRequest": { + "RewardScoreRequest": { "type": "object", "properties": { "dialog_generations": { @@ -5525,19 +5094,6 @@ "required": [ "dialog_generations", "model" - ], - "title": "Request to score a reward function. A list of prompts and a list of responses per prompt." - }, - "RewardScoringRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/RewardScoringRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "RewardScoringResponse": { @@ -5620,7 +5176,7 @@ "score" ] }, - "RunShieldRequest": { + "RunShieldsRequest": { "type": "object", "properties": { "messages": { @@ -5655,18 +5211,6 @@ "shields" ] }, - "RunShieldRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/RunShieldRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "RunShieldResponse": { "type": "object", "properties": { @@ -5753,7 +5297,38 @@ "alpha" ] }, - "PostTrainingSFTRequest": { + "QLoraFinetuningConfig": { + "type": "object", + "properties": { + "lora_attn_modules": { + "type": "array", + "items": { + "type": "string" + } + }, + "apply_lora_to_mlp": { + "type": "boolean" + }, + "apply_lora_to_output": { + "type": "boolean" + }, + "rank": { + "type": "integer" + }, + "alpha": { + "type": "integer" + } + }, + "additionalProperties": false, + "required": [ + "lora_attn_modules", + "apply_lora_to_mlp", + "apply_lora_to_output", + "rank", + "alpha" + ] + }, + "SupervisedFineTuneRequest": { "type": "object", "properties": { "job_uuid": { @@ -5853,53 +5428,9 @@ "training_config", "hyperparam_search_config", "logger_config" - ], - "title": "Request to finetune a model." - }, - "QLoraFinetuningConfig": { - "type": "object", - "properties": { - "lora_attn_modules": { - "type": "array", - "items": { - "type": "string" - } - }, - "apply_lora_to_mlp": { - "type": "boolean" - }, - "apply_lora_to_output": { - "type": "boolean" - }, - "rank": { - "type": "integer" - }, - "alpha": { - "type": "integer" - } - }, - "additionalProperties": false, - "required": [ - "lora_attn_modules", - "apply_lora_to_mlp", - "apply_lora_to_output", - "rank", - "alpha" ] }, - "PostTrainingSFTRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/PostTrainingSFTRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, - "SyntheticDataGenerationRequest": { + "SyntheticDataGenerateRequest": { "type": "object", "properties": { "dialogs": { @@ -5941,19 +5472,6 @@ "required": [ "dialogs", "filtering_function" - ], - "title": "Request to generate synthetic data. A small batch of prompts and a filtering function" - }, - "SyntheticDataGenerationRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/SyntheticDataGenerationRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" ] }, "SyntheticDataGenerationResponse": { @@ -6056,18 +5574,6 @@ "experiment_id" ] }, - "UpdateExperimentRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/UpdateExperimentRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "UpdateRunRequest": { "type": "object", "properties": { @@ -6112,18 +5618,6 @@ "run_id" ] }, - "UpdateRunRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/UpdateRunRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] - }, "UploadArtifactRequest": { "type": "object", "properties": { @@ -6173,18 +5667,6 @@ "artifact_type", "content" ] - }, - "UploadArtifactRequestWrapper": { - "type": "object", - "properties": { - "request": { - "$ref": "#/components/schemas/UploadArtifactRequest" - } - }, - "additionalProperties": false, - "required": [ - "request" - ] } }, "responses": {} @@ -6195,17 +5677,17 @@ } ], "tags": [ + { + "name": "Telemetry" + }, + { + "name": "Evaluations" + }, { "name": "PostTraining" }, { - "name": "RewardScoring" - }, - { - "name": "Safety" - }, - { - "name": "Memory" + "name": "Datasets" }, { "name": "SyntheticDataGeneration" @@ -6213,24 +5695,20 @@ { "name": "BatchInference" }, - { - "name": "AgenticSystem" - }, - { - "name": "Telemetry" - }, - { - "name": "Evaluations" - }, { "name": "Inference" }, { - "name": "Datasets" + "name": "AgenticSystem" }, { - "name": "BatchChatCompletionRequest", - "description": "" + "name": "Safety" + }, + { + "name": "Memory" + }, + { + "name": "RewardScoring" }, { "name": "BuiltinTool", @@ -6285,8 +5763,8 @@ "description": "" }, { - "name": "BatchChatCompletionRequestWrapper", - "description": "" + "name": "BatchChatCompletionRequest", + "description": "" }, { "name": "BatchChatCompletionResponse", @@ -6296,10 +5774,6 @@ "name": "BatchCompletionRequest", "description": "" }, - { - "name": "BatchCompletionRequestWrapper", - "description": "" - }, { "name": "BatchCompletionResponse", "description": "" @@ -6412,17 +5886,13 @@ "name": "AgenticSystemSessionCreateResponse", "description": "" }, - { - "name": "AgenticSystemTurnCreateRequest", - "description": "" - }, { "name": "Attachment", "description": "" }, { - "name": "AgenticSystemTurnCreateRequestWrapper", - "description": "" + "name": "CreateAgenticSystemTurnRequest", + "description": "" }, { "name": "AgenticSystemTurnResponseEvent", @@ -6480,10 +5950,6 @@ "name": "Turn", "description": "A single turn in an interaction with an Agentic System.\n\n" }, - { - "name": "CreateDatasetRequest", - "description": "Request to create a dataset.\n\n" - }, { "name": "TrainEvalDataset", "description": "Dataset to be used for training or evaluating language models.\n\n" @@ -6493,17 +5959,13 @@ "description": "" }, { - "name": "CreateDatasetRequestWrapper", - "description": "" + "name": "CreateDatasetRequest", + "description": "" }, { "name": "CreateExperimentRequest", "description": "" }, - { - "name": "CreateExperimentRequestWrapper", - "description": "" - }, { "name": "Experiment", "description": "" @@ -6524,10 +5986,6 @@ "name": "CreateRunRequest", "description": "" }, - { - "name": "CreateRunRequestWrapper", - "description": "" - }, { "name": "Run", "description": "" @@ -6560,17 +6018,9 @@ "name": "EmbeddingsResponse", "description": "" }, - { - "name": "Checkpoint", - "description": "Checkpoint created during training runs\n\n" - }, { "name": "EvaluateQuestionAnsweringRequest", - "description": "Request to evaluate question answering.\n\n" - }, - { - "name": "EvaluateQuestionAnsweringRequestWrapper", - "description": "" + "description": "" }, { "name": "EvaluationJob", @@ -6578,19 +6028,11 @@ }, { "name": "EvaluateSummarizationRequest", - "description": "Request to evaluate summarization.\n\n" - }, - { - "name": "EvaluateSummarizationRequestWrapper", - "description": "" + "description": "" }, { "name": "EvaluateTextGenerationRequest", - "description": "Request to evaluate text generation.\n\n" - }, - { - "name": "EvaluateTextGenerationRequestWrapper", - "description": "" + "description": "" }, { "name": "GetAgenticSystemSessionRequest", @@ -6633,12 +6075,8 @@ "description": "" }, { - "name": "LogSearchRequest", - "description": "" - }, - { - "name": "LogSearchRequestWrapper", - "description": "" + "name": "GetLogsRequest", + "description": "" }, { "name": "Log", @@ -6648,6 +6086,10 @@ "name": "Metric", "description": "" }, + { + "name": "Checkpoint", + "description": "Checkpoint created during training runs\n\n" + }, { "name": "PostTrainingJobArtifactsResponse", "description": "Artifacts of a finetuning job.\n\n" @@ -6680,18 +6122,10 @@ "name": "LogMessagesRequest", "description": "" }, - { - "name": "LogMessagesRequestWrapper", - "description": "" - }, { "name": "LogMetricsRequest", "description": "" }, - { - "name": "LogMetricsRequestWrapper", - "description": "" - }, { "name": "DPOAlignmentConfig", "description": "" @@ -6700,10 +6134,6 @@ "name": "OptimizerConfig", "description": "" }, - { - "name": "PostTrainingRLHFRequest", - "description": "Request to finetune a model.\n\n" - }, { "name": "RLHFAlgorithm", "description": "" @@ -6713,8 +6143,8 @@ "description": "" }, { - "name": "PostTrainingRLHFRequestWrapper", - "description": "" + "name": "PreferenceOptimizeRequest", + "description": "" }, { "name": "QueryDocumentsRequest", @@ -6729,12 +6159,8 @@ "description": "" }, { - "name": "RewardScoringRequest", - "description": "Request to score a reward function. A list of prompts and a list of responses per prompt.\n\n" - }, - { - "name": "RewardScoringRequestWrapper", - "description": "" + "name": "RewardScoreRequest", + "description": "" }, { "name": "RewardScoringResponse", @@ -6749,12 +6175,8 @@ "description": "" }, { - "name": "RunShieldRequest", - "description": "" - }, - { - "name": "RunShieldRequestWrapper", - "description": "" + "name": "RunShieldsRequest", + "description": "" }, { "name": "RunShieldResponse", @@ -6772,25 +6194,17 @@ "name": "LoraFinetuningConfig", "description": "" }, - { - "name": "PostTrainingSFTRequest", - "description": "Request to finetune a model.\n\n" - }, { "name": "QLoraFinetuningConfig", "description": "" }, { - "name": "PostTrainingSFTRequestWrapper", - "description": "" + "name": "SupervisedFineTuneRequest", + "description": "" }, { - "name": "SyntheticDataGenerationRequest", - "description": "Request to generate synthetic data. A small batch of prompts and a filtering function\n\n" - }, - { - "name": "SyntheticDataGenerationRequestWrapper", - "description": "" + "name": "SyntheticDataGenerateRequest", + "description": "" }, { "name": "SyntheticDataGenerationResponse", @@ -6804,25 +6218,13 @@ "name": "UpdateExperimentRequest", "description": "" }, - { - "name": "UpdateExperimentRequestWrapper", - "description": "" - }, { "name": "UpdateRunRequest", "description": "" }, - { - "name": "UpdateRunRequestWrapper", - "description": "" - }, { "name": "UploadArtifactRequest", "description": "" - }, - { - "name": "UploadArtifactRequestWrapper", - "description": "" } ], "x-tagGroups": [ @@ -6849,8 +6251,6 @@ "AgenticSystemCreateResponse", "AgenticSystemSessionCreateResponse", "AgenticSystemStepResponse", - "AgenticSystemTurnCreateRequest", - "AgenticSystemTurnCreateRequestWrapper", "AgenticSystemTurnResponseEvent", "AgenticSystemTurnResponseStepCompletePayload", "AgenticSystemTurnResponseStepProgressPayload", @@ -6862,10 +6262,8 @@ "ArtifactType", "Attachment", "BatchChatCompletionRequest", - "BatchChatCompletionRequestWrapper", "BatchChatCompletionResponse", "BatchCompletionRequest", - "BatchCompletionRequestWrapper", "BatchCompletionResponse", "BuiltinShield", "BuiltinTool", @@ -6882,13 +6280,11 @@ "CompletionResponseStreamChunk", "CreateAgenticSystemRequest", "CreateAgenticSystemSessionRequest", + "CreateAgenticSystemTurnRequest", "CreateDatasetRequest", - "CreateDatasetRequestWrapper", "CreateExperimentRequest", - "CreateExperimentRequestWrapper", "CreateMemoryBankRequest", "CreateRunRequest", - "CreateRunRequestWrapper", "DPOAlignmentConfig", "DeleteAgenticSystemRequest", "DeleteAgenticSystemSessionRequest", @@ -6900,11 +6296,8 @@ "EmbeddingsRequest", "EmbeddingsResponse", "EvaluateQuestionAnsweringRequest", - "EvaluateQuestionAnsweringRequestWrapper", "EvaluateSummarizationRequest", - "EvaluateSummarizationRequestWrapper", "EvaluateTextGenerationRequest", - "EvaluateTextGenerationRequestWrapper", "EvaluationJob", "EvaluationJobArtifactsResponse", "EvaluationJobLogStream", @@ -6915,16 +6308,13 @@ "FunctionCallToolDefinition", "GetAgenticSystemSessionRequest", "GetDocumentsRequest", + "GetLogsRequest", "InferenceStep", "InsertDocumentsRequest", "ListArtifactsRequest", "Log", "LogMessagesRequest", - "LogMessagesRequestWrapper", "LogMetricsRequest", - "LogMetricsRequestWrapper", - "LogSearchRequest", - "LogSearchRequestWrapper", "LoraFinetuningConfig", "MemoryBank", "MemoryBankDocument", @@ -6938,23 +6328,18 @@ "PostTrainingJobLogStream", "PostTrainingJobStatus", "PostTrainingJobStatusResponse", - "PostTrainingRLHFRequest", - "PostTrainingRLHFRequestWrapper", - "PostTrainingSFTRequest", - "PostTrainingSFTRequestWrapper", + "PreferenceOptimizeRequest", "QLoraFinetuningConfig", "QueryDocumentsRequest", "QueryDocumentsResponse", "RLHFAlgorithm", "RestAPIExecutionConfig", "RestAPIMethod", - "RewardScoringRequest", - "RewardScoringRequestWrapper", + "RewardScoreRequest", "RewardScoringResponse", "Run", - "RunShieldRequest", - "RunShieldRequestWrapper", "RunShieldResponse", + "RunShieldsRequest", "SamplingParams", "SamplingStrategy", "ScoredDialogGenerations", @@ -6965,8 +6350,8 @@ "ShieldDefinition", "ShieldResponse", "StopReason", - "SyntheticDataGenerationRequest", - "SyntheticDataGenerationRequestWrapper", + "SupervisedFineTuneRequest", + "SyntheticDataGenerateRequest", "SyntheticDataGenerationResponse", "SystemMessage", "TokenLogProbs", @@ -6987,11 +6372,8 @@ "URL", "UpdateDocumentsRequest", "UpdateExperimentRequest", - "UpdateExperimentRequestWrapper", "UpdateRunRequest", - "UpdateRunRequestWrapper", "UploadArtifactRequest", - "UploadArtifactRequestWrapper", "UserMessage", "WolframAlphaToolDefinition" ] diff --git a/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.yaml b/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.yaml index 877639f51..b029f9adf 100644 --- a/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.yaml +++ b/rfcs/RFC-0001-llama-stack-assets/llama-stack-spec.yaml @@ -180,180 +180,6 @@ components: required: - step type: object - AgenticSystemTurnCreateRequest: - additionalProperties: false - properties: - agent_id: - type: string - attachments: - items: - $ref: '#/components/schemas/Attachment' - type: array - input_shields: - items: - $ref: '#/components/schemas/ShieldDefinition' - type: array - instructions: - type: string - messages: - items: - oneOf: - - $ref: '#/components/schemas/UserMessage' - - $ref: '#/components/schemas/ToolResponseMessage' - type: array - output_shields: - items: - $ref: '#/components/schemas/ShieldDefinition' - type: array - sampling_params: - $ref: '#/components/schemas/SamplingParams' - session_id: - type: string - stream: - type: boolean - tool_choice: - $ref: '#/components/schemas/ToolChoice' - tool_prompt_format: - $ref: '#/components/schemas/ToolPromptFormat' - tools: - items: - oneOf: - - $ref: '#/components/schemas/SearchToolDefinition' - - $ref: '#/components/schemas/WolframAlphaToolDefinition' - - $ref: '#/components/schemas/PhotogenToolDefinition' - - $ref: '#/components/schemas/CodeInterpreterToolDefinition' - - $ref: '#/components/schemas/FunctionCallToolDefinition' - - additionalProperties: false - properties: - input_shields: - items: - $ref: '#/components/schemas/ShieldDefinition' - type: array - max_chunks: - type: integer - max_tokens_in_context: - type: integer - memory_bank_configs: - items: - oneOf: - - additionalProperties: false - properties: - bank_id: - type: string - type: - const: vector - type: string - required: - - bank_id - - type - type: object - - additionalProperties: false - properties: - bank_id: - type: string - keys: - items: - type: string - type: array - type: - const: keyvalue - type: string - required: - - bank_id - - type - - keys - type: object - - additionalProperties: false - properties: - bank_id: - type: string - type: - const: keyword - type: string - required: - - bank_id - - type - type: object - - additionalProperties: false - properties: - bank_id: - type: string - entities: - items: - type: string - type: array - type: - const: graph - type: string - required: - - bank_id - - type - - entities - type: object - type: array - output_shields: - items: - $ref: '#/components/schemas/ShieldDefinition' - type: array - query_generator_config: - oneOf: - - additionalProperties: false - properties: - sep: - type: string - type: - const: default - type: string - required: - - type - - sep - type: object - - additionalProperties: false - properties: - model: - type: string - template: - type: string - type: - const: llm - type: string - required: - - type - - model - - template - type: object - - additionalProperties: false - properties: - type: - const: custom - type: string - required: - - type - type: object - type: - const: memory - type: string - required: - - type - - memory_bank_configs - - query_generator_config - - max_tokens_in_context - - max_chunks - type: object - type: array - required: - - agent_id - - session_id - - messages - type: object - AgenticSystemTurnCreateRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/AgenticSystemTurnCreateRequest' - required: - - request - type: object AgenticSystemTurnResponseEvent: additionalProperties: false properties: @@ -574,14 +400,6 @@ components: - model - messages_batch type: object - BatchChatCompletionRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/BatchChatCompletionRequest' - required: - - request - type: object BatchChatCompletionResponse: additionalProperties: false properties: @@ -617,14 +435,6 @@ components: - model - content_batch type: object - BatchCompletionRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/BatchCompletionRequest' - required: - - request - type: object BatchCompletionResponse: additionalProperties: false properties: @@ -843,6 +653,30 @@ components: - agent_id - session_name type: object + CreateAgenticSystemTurnRequest: + additionalProperties: false + properties: + agent_id: + type: string + attachments: + items: + $ref: '#/components/schemas/Attachment' + type: array + messages: + items: + oneOf: + - $ref: '#/components/schemas/UserMessage' + - $ref: '#/components/schemas/ToolResponseMessage' + type: array + session_id: + type: string + stream: + type: boolean + required: + - agent_id + - session_id + - messages + type: object CreateDatasetRequest: additionalProperties: false properties: @@ -853,15 +687,6 @@ components: required: - uuid - dataset - title: Request to create a dataset. - type: object - CreateDatasetRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/CreateDatasetRequest' - required: - - request type: object CreateExperimentRequest: additionalProperties: false @@ -881,14 +706,6 @@ components: required: - name type: object - CreateExperimentRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/CreateExperimentRequest' - required: - - request - type: object CreateMemoryBankRequest: additionalProperties: false properties: @@ -960,14 +777,6 @@ components: required: - experiment_id type: object - CreateRunRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/CreateRunRequest' - required: - - request - type: object DPOAlignmentConfig: additionalProperties: false properties: @@ -1110,12 +919,6 @@ components: EvaluateQuestionAnsweringRequest: additionalProperties: false properties: - checkpoint: - $ref: '#/components/schemas/Checkpoint' - dataset: - $ref: '#/components/schemas/TrainEvalDataset' - job_uuid: - type: string metrics: items: enum: @@ -1123,33 +926,12 @@ components: - f1 type: string type: array - sampling_params: - $ref: '#/components/schemas/SamplingParams' required: - - job_uuid - - dataset - - checkpoint - - sampling_params - metrics - title: Request to evaluate question answering. - type: object - EvaluateQuestionAnsweringRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/EvaluateQuestionAnsweringRequest' - required: - - request type: object EvaluateSummarizationRequest: additionalProperties: false properties: - checkpoint: - $ref: '#/components/schemas/Checkpoint' - dataset: - $ref: '#/components/schemas/TrainEvalDataset' - job_uuid: - type: string metrics: items: enum: @@ -1157,33 +939,12 @@ components: - bleu type: string type: array - sampling_params: - $ref: '#/components/schemas/SamplingParams' required: - - job_uuid - - dataset - - checkpoint - - sampling_params - metrics - title: Request to evaluate summarization. - type: object - EvaluateSummarizationRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/EvaluateSummarizationRequest' - required: - - request type: object EvaluateTextGenerationRequest: additionalProperties: false properties: - checkpoint: - $ref: '#/components/schemas/Checkpoint' - dataset: - $ref: '#/components/schemas/TrainEvalDataset' - job_uuid: - type: string metrics: items: enum: @@ -1192,23 +953,8 @@ components: - bleu type: string type: array - sampling_params: - $ref: '#/components/schemas/SamplingParams' required: - - job_uuid - - dataset - - checkpoint - - sampling_params - metrics - title: Request to evaluate text generation. - type: object - EvaluateTextGenerationRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/EvaluateTextGenerationRequest' - required: - - request type: object EvaluationJob: additionalProperties: false @@ -1338,6 +1084,20 @@ components: required: - document_ids type: object + GetLogsRequest: + additionalProperties: false + properties: + filters: + additionalProperties: + oneOf: + - type: 'null' + - type: boolean + - type: number + - type: string + - type: array + - type: object + type: object + type: object InferenceStep: additionalProperties: false properties: @@ -1423,14 +1183,6 @@ components: required: - logs type: object - LogMessagesRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/LogMessagesRequest' - required: - - request - type: object LogMetricsRequest: additionalProperties: false properties: @@ -1444,40 +1196,6 @@ components: - run_id - metrics type: object - LogMetricsRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/LogMetricsRequest' - required: - - request - type: object - LogSearchRequest: - additionalProperties: false - properties: - filters: - additionalProperties: - oneOf: - - type: 'null' - - type: boolean - - type: number - - type: string - - type: array - - type: object - type: object - query: - type: string - required: - - query - type: object - LogSearchRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/LogSearchRequest' - required: - - request - type: object LoraFinetuningConfig: additionalProperties: false properties: @@ -1766,7 +1484,7 @@ components: - checkpoints title: Status of a finetuning job. type: object - PostTrainingRLHFRequest: + PreferenceOptimizeRequest: additionalProperties: false properties: algorithm: @@ -1816,78 +1534,6 @@ components: - training_config - hyperparam_search_config - logger_config - title: Request to finetune a model. - type: object - PostTrainingRLHFRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/PostTrainingRLHFRequest' - required: - - request - type: object - PostTrainingSFTRequest: - additionalProperties: false - properties: - algorithm: - $ref: '#/components/schemas/FinetuningAlgorithm' - algorithm_config: - oneOf: - - $ref: '#/components/schemas/LoraFinetuningConfig' - - $ref: '#/components/schemas/QLoraFinetuningConfig' - - $ref: '#/components/schemas/DoraFinetuningConfig' - dataset: - $ref: '#/components/schemas/TrainEvalDataset' - hyperparam_search_config: - additionalProperties: - oneOf: - - type: 'null' - - type: boolean - - type: number - - type: string - - type: array - - type: object - type: object - job_uuid: - type: string - logger_config: - additionalProperties: - oneOf: - - type: 'null' - - type: boolean - - type: number - - type: string - - type: array - - type: object - type: object - model: - type: string - optimizer_config: - $ref: '#/components/schemas/OptimizerConfig' - training_config: - $ref: '#/components/schemas/TrainingConfig' - validation_dataset: - $ref: '#/components/schemas/TrainEvalDataset' - required: - - job_uuid - - model - - dataset - - validation_dataset - - algorithm - - algorithm_config - - optimizer_config - - training_config - - hyperparam_search_config - - logger_config - title: Request to finetune a model. - type: object - PostTrainingSFTRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/PostTrainingSFTRequest' - required: - - request type: object QLoraFinetuningConfig: additionalProperties: false @@ -2019,7 +1665,7 @@ components: - PUT - DELETE type: string - RewardScoringRequest: + RewardScoreRequest: additionalProperties: false properties: dialog_generations: @@ -2031,16 +1677,6 @@ components: required: - dialog_generations - model - title: Request to score a reward function. A list of prompts and a list of responses - per prompt. - type: object - RewardScoringRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/RewardScoringRequest' - required: - - request type: object RewardScoringResponse: additionalProperties: false @@ -2086,7 +1722,17 @@ components: - started_at - metadata type: object - RunShieldRequest: + RunShieldResponse: + additionalProperties: false + properties: + responses: + items: + $ref: '#/components/schemas/ShieldResponse' + type: array + required: + - responses + type: object + RunShieldsRequest: additionalProperties: false properties: messages: @@ -2105,24 +1751,6 @@ components: - messages - shields type: object - RunShieldRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/RunShieldRequest' - required: - - request - type: object - RunShieldResponse: - additionalProperties: false - properties: - responses: - items: - $ref: '#/components/schemas/ShieldResponse' - type: array - required: - - responses - type: object SamplingParams: additionalProperties: false properties: @@ -2297,7 +1925,61 @@ components: - end_of_message - out_of_tokens type: string - SyntheticDataGenerationRequest: + SupervisedFineTuneRequest: + additionalProperties: false + properties: + algorithm: + $ref: '#/components/schemas/FinetuningAlgorithm' + algorithm_config: + oneOf: + - $ref: '#/components/schemas/LoraFinetuningConfig' + - $ref: '#/components/schemas/QLoraFinetuningConfig' + - $ref: '#/components/schemas/DoraFinetuningConfig' + dataset: + $ref: '#/components/schemas/TrainEvalDataset' + hyperparam_search_config: + additionalProperties: + oneOf: + - type: 'null' + - type: boolean + - type: number + - type: string + - type: array + - type: object + type: object + job_uuid: + type: string + logger_config: + additionalProperties: + oneOf: + - type: 'null' + - type: boolean + - type: number + - type: string + - type: array + - type: object + type: object + model: + type: string + optimizer_config: + $ref: '#/components/schemas/OptimizerConfig' + training_config: + $ref: '#/components/schemas/TrainingConfig' + validation_dataset: + $ref: '#/components/schemas/TrainEvalDataset' + required: + - job_uuid + - model + - dataset + - validation_dataset + - algorithm + - algorithm_config + - optimizer_config + - training_config + - hyperparam_search_config + - logger_config + type: object + SyntheticDataGenerateRequest: additionalProperties: false properties: dialogs: @@ -2323,16 +2005,6 @@ components: required: - dialogs - filtering_function - title: Request to generate synthetic data. A small batch of prompts and a filtering - function - type: object - SyntheticDataGenerationRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/SyntheticDataGenerationRequest' - required: - - request type: object SyntheticDataGenerationResponse: additionalProperties: false @@ -2702,14 +2374,6 @@ components: required: - experiment_id type: object - UpdateExperimentRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/UpdateExperimentRequest' - required: - - request - type: object UpdateRunRequest: additionalProperties: false properties: @@ -2733,14 +2397,6 @@ components: required: - run_id type: object - UpdateRunRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/UpdateRunRequest' - required: - - request - type: object UploadArtifactRequest: additionalProperties: false properties: @@ -2769,14 +2425,6 @@ components: - artifact_type - content type: object - UploadArtifactRequestWrapper: - additionalProperties: false - properties: - request: - $ref: '#/components/schemas/UploadArtifactRequest' - required: - - request - type: object UserMessage: additionalProperties: false properties: @@ -2822,7 +2470,7 @@ info: description: "This is the specification of the llama stack that provides\n \ \ a set of endpoints and their corresponding interfaces that are tailored\ \ to\n best leverage Llama Models. The specification is still in\ - \ draft and subject to change.\n Generated at 2024-09-11 12:34:17.939867" + \ draft and subject to change.\n Generated at 2024-09-11 14:17:44.361462" title: '[DRAFT] Llama Stack Specification' version: 0.0.1 jsonSchemaDialect: https://json-schema.org/draft/2020-12/schema @@ -2954,7 +2602,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/AgenticSystemTurnCreateRequestWrapper' + $ref: '#/components/schemas/CreateAgenticSystemTurnRequest' required: true responses: '200': @@ -3011,7 +2659,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/BatchChatCompletionRequestWrapper' + $ref: '#/components/schemas/BatchChatCompletionRequest' required: true responses: '200': @@ -3029,7 +2677,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/BatchCompletionRequestWrapper' + $ref: '#/components/schemas/BatchCompletionRequest' required: true responses: '200': @@ -3047,7 +2695,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/CreateDatasetRequestWrapper' + $ref: '#/components/schemas/CreateDatasetRequest' required: true responses: '200': @@ -3169,7 +2817,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/EvaluateQuestionAnsweringRequestWrapper' + $ref: '#/components/schemas/EvaluateQuestionAnsweringRequest' required: true responses: '200': @@ -3187,7 +2835,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/EvaluateSummarizationRequestWrapper' + $ref: '#/components/schemas/EvaluateSummarizationRequest' required: true responses: '200': @@ -3205,7 +2853,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/EvaluateTextGenerationRequestWrapper' + $ref: '#/components/schemas/EvaluateTextGenerationRequest' required: true responses: '200': @@ -3241,7 +2889,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/UploadArtifactRequestWrapper' + $ref: '#/components/schemas/UploadArtifactRequest' required: true responses: '200': @@ -3259,7 +2907,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/CreateExperimentRequestWrapper' + $ref: '#/components/schemas/CreateExperimentRequest' required: true responses: '200': @@ -3277,7 +2925,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/CreateRunRequestWrapper' + $ref: '#/components/schemas/CreateRunRequest' required: true responses: '200': @@ -3324,7 +2972,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/UpdateExperimentRequestWrapper' + $ref: '#/components/schemas/UpdateExperimentRequest' required: true responses: '200': @@ -3391,12 +3039,17 @@ paths: - Inference /logging/get_logs: post: - parameters: [] + parameters: + - in: query + name: query + required: true + schema: + type: string requestBody: content: application/json: schema: - $ref: '#/components/schemas/LogSearchRequestWrapper' + $ref: '#/components/schemas/GetLogsRequest' required: true responses: '200': @@ -3414,7 +3067,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/LogMessagesRequestWrapper' + $ref: '#/components/schemas/LogMessagesRequest' required: true responses: '200': @@ -3655,7 +3308,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/PostTrainingRLHFRequestWrapper' + $ref: '#/components/schemas/PreferenceOptimizeRequest' required: true responses: '200': @@ -3673,7 +3326,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/PostTrainingSFTRequestWrapper' + $ref: '#/components/schemas/SupervisedFineTuneRequest' required: true responses: '200': @@ -3691,7 +3344,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/RewardScoringRequestWrapper' + $ref: '#/components/schemas/RewardScoreRequest' required: true responses: '200': @@ -3709,7 +3362,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/LogMetricsRequestWrapper' + $ref: '#/components/schemas/LogMetricsRequest' required: true responses: '200': @@ -3740,7 +3393,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/UpdateRunRequestWrapper' + $ref: '#/components/schemas/UpdateRunRequest' required: true responses: '200': @@ -3758,7 +3411,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/RunShieldRequestWrapper' + $ref: '#/components/schemas/RunShieldsRequest' required: true responses: '200': @@ -3776,7 +3429,7 @@ paths: content: application/json: schema: - $ref: '#/components/schemas/SyntheticDataGenerationRequestWrapper' + $ref: '#/components/schemas/SyntheticDataGenerateRequest' required: true responses: '200': @@ -3792,20 +3445,17 @@ security: servers: - url: http://any-hosted-llama-stack.com tags: -- name: PostTraining -- name: RewardScoring -- name: Safety -- name: Memory -- name: SyntheticDataGeneration -- name: BatchInference -- name: AgenticSystem - name: Telemetry - name: Evaluations -- name: Inference +- name: PostTraining - name: Datasets -- description: - name: BatchChatCompletionRequest +- name: SyntheticDataGeneration +- name: BatchInference +- name: Inference +- name: AgenticSystem +- name: Safety +- name: Memory +- name: RewardScoring - description: name: BuiltinTool - description: name: UserMessage -- description: - name: BatchChatCompletionRequestWrapper + name: BatchChatCompletionRequest - description: name: BatchChatCompletionResponse - description: name: BatchCompletionRequest -- description: - name: BatchCompletionRequestWrapper - description: name: BatchCompletionResponse @@ -3944,14 +3591,11 @@ tags: - description: name: AgenticSystemSessionCreateResponse -- description: - name: AgenticSystemTurnCreateRequest - description: name: Attachment -- description: - name: AgenticSystemTurnCreateRequestWrapper + name: CreateAgenticSystemTurnRequest - description: 'Streamed agent execution response. @@ -3995,11 +3639,6 @@ tags: ' name: Turn -- description: 'Request to create a dataset. - - - ' - name: CreateDatasetRequest - description: 'Dataset to be used for training or evaluating language models. @@ -4008,15 +3647,12 @@ tags: - description: name: TrainEvalDatasetColumnType -- description: - name: CreateDatasetRequestWrapper + name: CreateDatasetRequest - description: name: CreateExperimentRequest -- description: - name: CreateExperimentRequestWrapper - description: name: Experiment - description: name: CreateRunRequest -- description: - name: CreateRunRequestWrapper - description: name: Run - description: name: EmbeddingsResponse -- description: 'Checkpoint created during training runs - - - ' - name: Checkpoint -- description: 'Request to evaluate question answering. - - - ' - name: EvaluateQuestionAnsweringRequest -- description: - name: EvaluateQuestionAnsweringRequestWrapper + name: EvaluateQuestionAnsweringRequest - description: name: EvaluationJob -- description: 'Request to evaluate summarization. - - - ' +- description: name: EvaluateSummarizationRequest -- description: - name: EvaluateSummarizationRequestWrapper -- description: 'Request to evaluate text generation. - - - ' name: EvaluateTextGenerationRequest -- description: - name: EvaluateTextGenerationRequestWrapper - description: name: GetAgenticSystemSessionRequest @@ -4123,16 +3733,17 @@ tags: - description: name: EvaluationJobStatusResponse -- description: - name: LogSearchRequest -- description: - name: LogSearchRequestWrapper +- description: + name: GetLogsRequest - description: name: Log - description: name: Metric +- description: 'Checkpoint created during training runs + + + ' + name: Checkpoint - description: 'Artifacts of a finetuning job. @@ -4165,33 +3776,22 @@ tags: - description: name: LogMessagesRequest -- description: - name: LogMessagesRequestWrapper - description: name: LogMetricsRequest -- description: - name: LogMetricsRequestWrapper - description: name: DPOAlignmentConfig - description: name: OptimizerConfig -- description: 'Request to finetune a model. - - - ' - name: PostTrainingRLHFRequest - description: name: RLHFAlgorithm - description: name: TrainingConfig -- description: - name: PostTrainingRLHFRequestWrapper + name: PreferenceOptimizeRequest - description: name: QueryDocumentsRequest @@ -4201,15 +3801,9 @@ tags: - description: name: DialogGenerations -- description: 'Request to score a reward function. A list of prompts and a list of - responses per prompt. - - - ' - name: RewardScoringRequest -- description: - name: RewardScoringRequestWrapper + name: RewardScoreRequest - description: 'Response from the reward scoring. Batch of (prompt, response, score) tuples that pass the threshold. @@ -4221,12 +3815,9 @@ tags: name: ScoredDialogGenerations - description: name: ScoredMessage -- description: - name: RunShieldRequest -- description: - name: RunShieldRequestWrapper + name: RunShieldsRequest - description: name: RunShieldResponse @@ -4239,27 +3830,15 @@ tags: - description: name: LoraFinetuningConfig -- description: 'Request to finetune a model. - - - ' - name: PostTrainingSFTRequest - description: name: QLoraFinetuningConfig -- description: - name: PostTrainingSFTRequestWrapper -- description: 'Request to generate synthetic data. A small batch of prompts and a - filtering function - - - ' - name: SyntheticDataGenerationRequest -- description: - name: SyntheticDataGenerationRequestWrapper + name: SyntheticDataGenerateRequest - description: 'Response from the synthetic data generation. Batch of (prompt, response, score) tuples that pass the threshold. @@ -4273,21 +3852,12 @@ tags: - description: name: UpdateExperimentRequest -- description: - name: UpdateExperimentRequestWrapper - description: name: UpdateRunRequest -- description: - name: UpdateRunRequestWrapper - description: name: UploadArtifactRequest -- description: - name: UploadArtifactRequestWrapper x-tagGroups: - name: Operations tags: @@ -4308,8 +3878,6 @@ x-tagGroups: - AgenticSystemCreateResponse - AgenticSystemSessionCreateResponse - AgenticSystemStepResponse - - AgenticSystemTurnCreateRequest - - AgenticSystemTurnCreateRequestWrapper - AgenticSystemTurnResponseEvent - AgenticSystemTurnResponseStepCompletePayload - AgenticSystemTurnResponseStepProgressPayload @@ -4321,10 +3889,8 @@ x-tagGroups: - ArtifactType - Attachment - BatchChatCompletionRequest - - BatchChatCompletionRequestWrapper - BatchChatCompletionResponse - BatchCompletionRequest - - BatchCompletionRequestWrapper - BatchCompletionResponse - BuiltinShield - BuiltinTool @@ -4341,13 +3907,11 @@ x-tagGroups: - CompletionResponseStreamChunk - CreateAgenticSystemRequest - CreateAgenticSystemSessionRequest + - CreateAgenticSystemTurnRequest - CreateDatasetRequest - - CreateDatasetRequestWrapper - CreateExperimentRequest - - CreateExperimentRequestWrapper - CreateMemoryBankRequest - CreateRunRequest - - CreateRunRequestWrapper - DPOAlignmentConfig - DeleteAgenticSystemRequest - DeleteAgenticSystemSessionRequest @@ -4359,11 +3923,8 @@ x-tagGroups: - EmbeddingsRequest - EmbeddingsResponse - EvaluateQuestionAnsweringRequest - - EvaluateQuestionAnsweringRequestWrapper - EvaluateSummarizationRequest - - EvaluateSummarizationRequestWrapper - EvaluateTextGenerationRequest - - EvaluateTextGenerationRequestWrapper - EvaluationJob - EvaluationJobArtifactsResponse - EvaluationJobLogStream @@ -4374,16 +3935,13 @@ x-tagGroups: - FunctionCallToolDefinition - GetAgenticSystemSessionRequest - GetDocumentsRequest + - GetLogsRequest - InferenceStep - InsertDocumentsRequest - ListArtifactsRequest - Log - LogMessagesRequest - - LogMessagesRequestWrapper - LogMetricsRequest - - LogMetricsRequestWrapper - - LogSearchRequest - - LogSearchRequestWrapper - LoraFinetuningConfig - MemoryBank - MemoryBankDocument @@ -4397,23 +3955,18 @@ x-tagGroups: - PostTrainingJobLogStream - PostTrainingJobStatus - PostTrainingJobStatusResponse - - PostTrainingRLHFRequest - - PostTrainingRLHFRequestWrapper - - PostTrainingSFTRequest - - PostTrainingSFTRequestWrapper + - PreferenceOptimizeRequest - QLoraFinetuningConfig - QueryDocumentsRequest - QueryDocumentsResponse - RLHFAlgorithm - RestAPIExecutionConfig - RestAPIMethod - - RewardScoringRequest - - RewardScoringRequestWrapper + - RewardScoreRequest - RewardScoringResponse - Run - - RunShieldRequest - - RunShieldRequestWrapper - RunShieldResponse + - RunShieldsRequest - SamplingParams - SamplingStrategy - ScoredDialogGenerations @@ -4424,8 +3977,8 @@ x-tagGroups: - ShieldDefinition - ShieldResponse - StopReason - - SyntheticDataGenerationRequest - - SyntheticDataGenerationRequestWrapper + - SupervisedFineTuneRequest + - SyntheticDataGenerateRequest - SyntheticDataGenerationResponse - SystemMessage - TokenLogProbs @@ -4446,10 +3999,7 @@ x-tagGroups: - URL - UpdateDocumentsRequest - UpdateExperimentRequest - - UpdateExperimentRequestWrapper - UpdateRunRequest - - UpdateRunRequestWrapper - UploadArtifactRequest - - UploadArtifactRequestWrapper - UserMessage - WolframAlphaToolDefinition