forked from phoenix-oss/llama-stack-mirror
		
	feat(1/n): api: unify agents for handling server & client tools (#1178)
# Problem
Our current Agent framework has discrepancies in definition on how we
handle server side and client side tools.
1. Server Tools: a single Turn is returned including `ToolExecutionStep`
in agenst
2. Client Tools: `create_agent_turn` is called in loop with client agent
lib yielding the agent chunk
ad6ffc63df/src/llama_stack_client/lib/agents/agent.py (L186-L211)
This makes it inconsistent to work with server & client tools. It also
complicates the logs to telemetry to get information about agents turn /
history for observability.
#### Principle
The same `turn_id` should be used to represent the steps required to
complete a user message including client tools.
## Solution
1. `AgentTurnResponseEventType.turn_awaiting_input` status to indicate
that the current turn is not completed, and awaiting tool input
2. `continue_agent_turn` endpoint to update agent turn with client's
tool response.
# What does this PR do?
- Skeleton API as example
## Test Plan
[Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.*]
- Just API update, no functionality change
```
llama stack run + client-sdk test
```
<img width="842" alt="image"
src="https://github.com/user-attachments/assets/7ac56b5f-f424-4632-9476-7e0f57555bc3"
/>
[//]: # (## Documentation)
			
			
This commit is contained in:
		
							parent
							
								
									992f865b2e
								
							
						
					
					
						commit
						0fe071764f
					
				
					 7 changed files with 454 additions and 21 deletions
				
			
		
							
								
								
									
										113
									
								
								docs/_static/llama-stack-spec.html
									
										
									
									
										vendored
									
									
								
							
							
						
						
									
										113
									
								
								docs/_static/llama-stack-spec.html
									
										
									
									
										vendored
									
									
								
							|  | @ -2315,6 +2315,70 @@ | |||
|                 } | ||||
|             } | ||||
|         }, | ||||
|         "/v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/resume": { | ||||
|             "post": { | ||||
|                 "responses": { | ||||
|                     "200": { | ||||
|                         "description": "A Turn object if stream is False, otherwise an AsyncIterator of AgentTurnResponseStreamChunk objects.", | ||||
|                         "content": { | ||||
|                             "application/json": { | ||||
|                                 "schema": { | ||||
|                                     "$ref": "#/components/schemas/Turn" | ||||
|                                 } | ||||
|                             }, | ||||
|                             "text/event-stream": { | ||||
|                                 "schema": { | ||||
|                                     "$ref": "#/components/schemas/AgentTurnResponseStreamChunk" | ||||
|                                 } | ||||
|                             } | ||||
|                         } | ||||
|                     } | ||||
|                 }, | ||||
|                 "tags": [ | ||||
|                     "Agents" | ||||
|                 ], | ||||
|                 "description": "Resume an agent turn with executed tool call responses.\nWhen a Turn has the status `awaiting_input` due to pending input from client side tool calls, this endpoint can be used to submit the outputs from the tool calls once they are ready.", | ||||
|                 "parameters": [ | ||||
|                     { | ||||
|                         "name": "agent_id", | ||||
|                         "in": "path", | ||||
|                         "description": "The ID of the agent to resume.", | ||||
|                         "required": true, | ||||
|                         "schema": { | ||||
|                             "type": "string" | ||||
|                         } | ||||
|                     }, | ||||
|                     { | ||||
|                         "name": "session_id", | ||||
|                         "in": "path", | ||||
|                         "description": "The ID of the session to resume.", | ||||
|                         "required": true, | ||||
|                         "schema": { | ||||
|                             "type": "string" | ||||
|                         } | ||||
|                     }, | ||||
|                     { | ||||
|                         "name": "turn_id", | ||||
|                         "in": "path", | ||||
|                         "description": "The ID of the turn to resume.", | ||||
|                         "required": true, | ||||
|                         "schema": { | ||||
|                             "type": "string" | ||||
|                         } | ||||
|                     } | ||||
|                 ], | ||||
|                 "requestBody": { | ||||
|                     "content": { | ||||
|                         "application/json": { | ||||
|                             "schema": { | ||||
|                                 "$ref": "#/components/schemas/ResumeAgentTurnRequest" | ||||
|                             } | ||||
|                         } | ||||
|                     }, | ||||
|                     "required": true | ||||
|                 } | ||||
|             } | ||||
|         }, | ||||
|         "/v1/eval/benchmarks/{benchmark_id}/jobs": { | ||||
|             "post": { | ||||
|                 "responses": { | ||||
|  | @ -4226,6 +4290,9 @@ | |||
|                     }, | ||||
|                     "tool_config": { | ||||
|                         "$ref": "#/components/schemas/ToolConfig" | ||||
|                     }, | ||||
|                     "allow_turn_resume": { | ||||
|                         "type": "boolean" | ||||
|                     } | ||||
|                 }, | ||||
|                 "additionalProperties": false, | ||||
|  | @ -4612,6 +4679,9 @@ | |||
|                     }, | ||||
|                     { | ||||
|                         "$ref": "#/components/schemas/AgentTurnResponseTurnCompletePayload" | ||||
|                     }, | ||||
|                     { | ||||
|                         "$ref": "#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload" | ||||
|                     } | ||||
|                 ], | ||||
|                 "discriminator": { | ||||
|  | @ -4621,7 +4691,8 @@ | |||
|                         "step_progress": "#/components/schemas/AgentTurnResponseStepProgressPayload", | ||||
|                         "step_complete": "#/components/schemas/AgentTurnResponseStepCompletePayload", | ||||
|                         "turn_start": "#/components/schemas/AgentTurnResponseTurnStartPayload", | ||||
|                         "turn_complete": "#/components/schemas/AgentTurnResponseTurnCompletePayload" | ||||
|                         "turn_complete": "#/components/schemas/AgentTurnResponseTurnCompletePayload", | ||||
|                         "turn_awaiting_input": "#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload" | ||||
|                     } | ||||
|                 } | ||||
|             }, | ||||
|  | @ -4784,6 +4855,25 @@ | |||
|                 "title": "AgentTurnResponseStreamChunk", | ||||
|                 "description": "streamed agent turn completion response." | ||||
|             }, | ||||
|             "AgentTurnResponseTurnAwaitingInputPayload": { | ||||
|                 "type": "object", | ||||
|                 "properties": { | ||||
|                     "event_type": { | ||||
|                         "type": "string", | ||||
|                         "const": "turn_awaiting_input", | ||||
|                         "default": "turn_awaiting_input" | ||||
|                     }, | ||||
|                     "turn": { | ||||
|                         "$ref": "#/components/schemas/Turn" | ||||
|                     } | ||||
|                 }, | ||||
|                 "additionalProperties": false, | ||||
|                 "required": [ | ||||
|                     "event_type", | ||||
|                     "turn" | ||||
|                 ], | ||||
|                 "title": "AgentTurnResponseTurnAwaitingInputPayload" | ||||
|             }, | ||||
|             "AgentTurnResponseTurnCompletePayload": { | ||||
|                 "type": "object", | ||||
|                 "properties": { | ||||
|  | @ -8046,6 +8136,27 @@ | |||
|                 ], | ||||
|                 "title": "RegisterVectorDbRequest" | ||||
|             }, | ||||
|             "ResumeAgentTurnRequest": { | ||||
|                 "type": "object", | ||||
|                 "properties": { | ||||
|                     "tool_responses": { | ||||
|                         "type": "array", | ||||
|                         "items": { | ||||
|                             "$ref": "#/components/schemas/ToolResponseMessage" | ||||
|                         }, | ||||
|                         "description": "The tool call responses to resume the turn with." | ||||
|                     }, | ||||
|                     "stream": { | ||||
|                         "type": "boolean", | ||||
|                         "description": "Whether to stream the response." | ||||
|                     } | ||||
|                 }, | ||||
|                 "additionalProperties": false, | ||||
|                 "required": [ | ||||
|                     "tool_responses" | ||||
|                 ], | ||||
|                 "title": "ResumeAgentTurnRequest" | ||||
|             }, | ||||
|             "RunEvalRequest": { | ||||
|                 "type": "object", | ||||
|                 "properties": { | ||||
|  |  | |||
							
								
								
									
										82
									
								
								docs/_static/llama-stack-spec.yaml
									
										
									
									
										vendored
									
									
								
							
							
						
						
									
										82
									
								
								docs/_static/llama-stack-spec.yaml
									
										
									
									
										vendored
									
									
								
							|  | @ -1401,6 +1401,53 @@ paths: | |||
|             schema: | ||||
|               $ref: '#/components/schemas/QueryTracesRequest' | ||||
|         required: true | ||||
|   /v1/agents/{agent_id}/session/{session_id}/turn/{turn_id}/resume: | ||||
|     post: | ||||
|       responses: | ||||
|         '200': | ||||
|           description: >- | ||||
|             A Turn object if stream is False, otherwise an AsyncIterator of AgentTurnResponseStreamChunk | ||||
|             objects. | ||||
|           content: | ||||
|             application/json: | ||||
|               schema: | ||||
|                 $ref: '#/components/schemas/Turn' | ||||
|             text/event-stream: | ||||
|               schema: | ||||
|                 $ref: '#/components/schemas/AgentTurnResponseStreamChunk' | ||||
|       tags: | ||||
|         - Agents | ||||
|       description: >- | ||||
|         Resume an agent turn with executed tool call responses. | ||||
| 
 | ||||
|         When a Turn has the status `awaiting_input` due to pending input from client | ||||
|         side tool calls, this endpoint can be used to submit the outputs from the | ||||
|         tool calls once they are ready. | ||||
|       parameters: | ||||
|         - name: agent_id | ||||
|           in: path | ||||
|           description: The ID of the agent to resume. | ||||
|           required: true | ||||
|           schema: | ||||
|             type: string | ||||
|         - name: session_id | ||||
|           in: path | ||||
|           description: The ID of the session to resume. | ||||
|           required: true | ||||
|           schema: | ||||
|             type: string | ||||
|         - name: turn_id | ||||
|           in: path | ||||
|           description: The ID of the turn to resume. | ||||
|           required: true | ||||
|           schema: | ||||
|             type: string | ||||
|       requestBody: | ||||
|         content: | ||||
|           application/json: | ||||
|             schema: | ||||
|               $ref: '#/components/schemas/ResumeAgentTurnRequest' | ||||
|         required: true | ||||
|   /v1/eval/benchmarks/{benchmark_id}/jobs: | ||||
|     post: | ||||
|       responses: | ||||
|  | @ -2740,6 +2787,8 @@ components: | |||
|             $ref: '#/components/schemas/AgentTool' | ||||
|         tool_config: | ||||
|           $ref: '#/components/schemas/ToolConfig' | ||||
|         allow_turn_resume: | ||||
|           type: boolean | ||||
|       additionalProperties: false | ||||
|       required: | ||||
|         - messages | ||||
|  | @ -2992,6 +3041,7 @@ components: | |||
|         - $ref: '#/components/schemas/AgentTurnResponseStepCompletePayload' | ||||
|         - $ref: '#/components/schemas/AgentTurnResponseTurnStartPayload' | ||||
|         - $ref: '#/components/schemas/AgentTurnResponseTurnCompletePayload' | ||||
|         - $ref: '#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload' | ||||
|       discriminator: | ||||
|         propertyName: event_type | ||||
|         mapping: | ||||
|  | @ -3000,6 +3050,7 @@ components: | |||
|           step_complete: '#/components/schemas/AgentTurnResponseStepCompletePayload' | ||||
|           turn_start: '#/components/schemas/AgentTurnResponseTurnStartPayload' | ||||
|           turn_complete: '#/components/schemas/AgentTurnResponseTurnCompletePayload' | ||||
|           turn_awaiting_input: '#/components/schemas/AgentTurnResponseTurnAwaitingInputPayload' | ||||
|     AgentTurnResponseStepCompletePayload: | ||||
|       type: object | ||||
|       properties: | ||||
|  | @ -3106,6 +3157,21 @@ components: | |||
|         - event | ||||
|       title: AgentTurnResponseStreamChunk | ||||
|       description: streamed agent turn completion response. | ||||
|     "AgentTurnResponseTurnAwaitingInputPayload": | ||||
|       type: object | ||||
|       properties: | ||||
|         event_type: | ||||
|           type: string | ||||
|           const: turn_awaiting_input | ||||
|           default: turn_awaiting_input | ||||
|         turn: | ||||
|           $ref: '#/components/schemas/Turn' | ||||
|       additionalProperties: false | ||||
|       required: | ||||
|         - event_type | ||||
|         - turn | ||||
|       title: >- | ||||
|         AgentTurnResponseTurnAwaitingInputPayload | ||||
|     AgentTurnResponseTurnCompletePayload: | ||||
|       type: object | ||||
|       properties: | ||||
|  | @ -5205,6 +5271,22 @@ components: | |||
|         - vector_db_id | ||||
|         - embedding_model | ||||
|       title: RegisterVectorDbRequest | ||||
|     ResumeAgentTurnRequest: | ||||
|       type: object | ||||
|       properties: | ||||
|         tool_responses: | ||||
|           type: array | ||||
|           items: | ||||
|             $ref: '#/components/schemas/ToolResponseMessage' | ||||
|           description: >- | ||||
|             The tool call responses to resume the turn with. | ||||
|         stream: | ||||
|           type: boolean | ||||
|           description: Whether to stream the response. | ||||
|       additionalProperties: false | ||||
|       required: | ||||
|         - tool_responses | ||||
|       title: ResumeAgentTurnRequest | ||||
|     RunEvalRequest: | ||||
|       type: object | ||||
|       properties: | ||||
|  |  | |||
		Loading…
	
	Add table
		Add a link
		
	
		Reference in a new issue