forked from phoenix-oss/llama-stack-mirror
		
	# Problem
Our current Agent framework has discrepancies in definition on how we
handle server side and client side tools.
1. Server Tools: a single Turn is returned including `ToolExecutionStep`
in agenst
2. Client Tools: `create_agent_turn` is called in loop with client agent
lib yielding the agent chunk
ad6ffc63df/src/llama_stack_client/lib/agents/agent.py (L186-L211)
This makes it inconsistent to work with server & client tools. It also
complicates the logs to telemetry to get information about agents turn /
history for observability.
#### Principle
The same `turn_id` should be used to represent the steps required to
complete a user message including client tools.
## Solution
1. `AgentTurnResponseEventType.turn_awaiting_input` status to indicate
that the current turn is not completed, and awaiting tool input
2. `continue_agent_turn` endpoint to update agent turn with client's
tool response.
# What does this PR do?
- Skeleton API as example
## Test Plan
[Describe the tests you ran to verify your changes with result
summaries. *Provide clear instructions so the plan can be easily
re-executed.*]
- Just API update, no functionality change
```
llama stack run + client-sdk test
```
<img width="842" alt="image"
src="https://github.com/user-attachments/assets/7ac56b5f-f424-4632-9476-7e0f57555bc3"
/>
[//]: # (## Documentation)
		
	
			
		
			
				
	
	
		
			98 lines
		
	
	
	
		
			3.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
			
		
		
	
	
			98 lines
		
	
	
	
		
			3.3 KiB
		
	
	
	
		
			Python
		
	
	
	
	
	
| # Copyright (c) Meta Platforms, Inc. and affiliates.
 | |
| # All rights reserved.
 | |
| #
 | |
| # This source code is licensed under the terms described in the LICENSE file in
 | |
| # the root directory of this source tree.
 | |
| 
 | |
| import json
 | |
| import logging
 | |
| import uuid
 | |
| from datetime import datetime
 | |
| from typing import List, Optional
 | |
| 
 | |
| from pydantic import BaseModel
 | |
| 
 | |
| from llama_stack.apis.agents import ToolExecutionStep, Turn
 | |
| from llama_stack.providers.utils.kvstore import KVStore
 | |
| 
 | |
| log = logging.getLogger(__name__)
 | |
| 
 | |
| 
 | |
| class AgentSessionInfo(BaseModel):
 | |
|     session_id: str
 | |
|     session_name: str
 | |
|     vector_db_id: Optional[str] = None
 | |
|     started_at: datetime
 | |
| 
 | |
| 
 | |
| class AgentPersistence:
 | |
|     def __init__(self, agent_id: str, kvstore: KVStore):
 | |
|         self.agent_id = agent_id
 | |
|         self.kvstore = kvstore
 | |
| 
 | |
|     async def create_session(self, name: str) -> str:
 | |
|         session_id = str(uuid.uuid4())
 | |
|         session_info = AgentSessionInfo(
 | |
|             session_id=session_id,
 | |
|             session_name=name,
 | |
|             started_at=datetime.now(),
 | |
|         )
 | |
|         await self.kvstore.set(
 | |
|             key=f"session:{self.agent_id}:{session_id}",
 | |
|             value=session_info.model_dump_json(),
 | |
|         )
 | |
|         return session_id
 | |
| 
 | |
|     async def get_session_info(self, session_id: str) -> Optional[AgentSessionInfo]:
 | |
|         value = await self.kvstore.get(
 | |
|             key=f"session:{self.agent_id}:{session_id}",
 | |
|         )
 | |
|         if not value:
 | |
|             return None
 | |
| 
 | |
|         return AgentSessionInfo(**json.loads(value))
 | |
| 
 | |
|     async def add_vector_db_to_session(self, session_id: str, vector_db_id: str):
 | |
|         session_info = await self.get_session_info(session_id)
 | |
|         if session_info is None:
 | |
|             raise ValueError(f"Session {session_id} not found")
 | |
| 
 | |
|         session_info.vector_db_id = vector_db_id
 | |
|         await self.kvstore.set(
 | |
|             key=f"session:{self.agent_id}:{session_id}",
 | |
|             value=session_info.model_dump_json(),
 | |
|         )
 | |
| 
 | |
|     async def add_turn_to_session(self, session_id: str, turn: Turn):
 | |
|         await self.kvstore.set(
 | |
|             key=f"session:{self.agent_id}:{session_id}:{turn.turn_id}",
 | |
|             value=turn.model_dump_json(),
 | |
|         )
 | |
| 
 | |
|     async def get_session_turns(self, session_id: str) -> List[Turn]:
 | |
|         values = await self.kvstore.range(
 | |
|             start_key=f"session:{self.agent_id}:{session_id}:",
 | |
|             end_key=f"session:{self.agent_id}:{session_id}:\xff\xff\xff\xff",
 | |
|         )
 | |
|         turns = []
 | |
|         for value in values:
 | |
|             try:
 | |
|                 turn = Turn(**json.loads(value))
 | |
|                 turns.append(turn)
 | |
|             except Exception as e:
 | |
|                 log.error(f"Error parsing turn: {e}")
 | |
|                 continue
 | |
|         turns.sort(key=lambda x: (x.completed_at or datetime.min))
 | |
|         return turns
 | |
| 
 | |
|     async def set_in_progress_tool_call_step(self, session_id: str, turn_id: str, step: ToolExecutionStep):
 | |
|         await self.kvstore.set(
 | |
|             key=f"in_progress_tool_call_step:{self.agent_id}:{session_id}:{turn_id}",
 | |
|             value=step.model_dump_json(),
 | |
|         )
 | |
| 
 | |
|     async def get_in_progress_tool_call_step(self, session_id: str, turn_id: str) -> Optional[ToolExecutionStep]:
 | |
|         value = await self.kvstore.get(
 | |
|             key=f"in_progress_tool_call_step:{self.agent_id}:{session_id}:{turn_id}",
 | |
|         )
 | |
|         return ToolExecutionStep(**json.loads(value)) if value else None
 |