mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-28 02:53:30 +00:00
test: remove old test (#1334)
Summary: This test is no longer relevant. We updated the default system prompt in https://github.com/meta-llama/llama-stack/pull/1310, and system override behavior is already unit-tested in test_prompt_adapter.py. Test Plan: read
This commit is contained in:
parent
2faee24873
commit
ba3bedc7e9
1 changed files with 0 additions and 81 deletions
|
@ -314,87 +314,6 @@ def test_tool_choice(llama_stack_client, agent_config):
|
|||
assert len(tool_execution_steps) >= 1 and tool_execution_steps[0].tool_calls[0].tool_name == "get_boiling_point"
|
||||
|
||||
|
||||
# TODO: fix this flaky test
|
||||
def xtest_override_system_message_behavior(llama_stack_client, agent_config):
    """Exercise an agent with and without ``system_message_behavior: "replace"``.

    Phase 1 builds an agent whose instructions are just "You are a pirate"
    and asks for a joke; the assertion expects the word "function" to show
    up in the logged output.

    Phase 2 rebuilds the agent with a full replacement prompt (containing the
    ``{{ function_description }}`` placeholder) and
    ``tool_config.system_message_behavior = "replace"``, then checks that the
    joke request is answered and that a boiling-point question goes through
    the ``get_boiling_point`` client tool.

    NOTE(review): the ``x`` prefix presumably keeps pytest's default
    ``test_*`` collection from picking this up -- confirm against the
    project's pytest configuration.
    """

    def run_turn(active_agent, active_session, prompt):
        # Send a single user message and flatten every non-None log entry
        # produced by EventLogger into one string for substring assertions.
        turn = active_agent.create_turn(
            messages=[
                {
                    "role": "user",
                    "content": prompt,
                },
            ],
            session_id=active_session,
        )
        return "".join(str(entry) for entry in EventLogger().log(turn) if entry is not None)

    boiling_point_tool = get_boiling_point

    # --- Phase 1: minimal "pirate" instructions -------------------------
    pirate_config = {
        **agent_config,
        "instructions": "You are a pirate",
        "client_tools": [boiling_point_tool.get_tool_definition()],
        "model": "meta-llama/Llama-3.2-3B-Instruct",
    }
    pirate_agent = Agent(llama_stack_client, pirate_config, client_tools=(boiling_point_tool,))
    pirate_session = pirate_agent.create_session(f"test-session-{uuid4()}")

    pirate_output = run_turn(pirate_agent, pirate_session, "tell me a joke about bicycles")
    # can't tell a joke: "I don't have a function"
    assert "function" in pirate_output

    # --- Phase 2: system message behavior "replace" ----------------------
    replacement_prompt = """
You are a helpful assistant. You have access to functions, but you should only use them if they are required.

You are an expert in composing functions. You are given a question and a set of possible functions.
Based on the question, you may or may not need to make one or more function/tool calls to achieve the purpose.
If none of the function can be used, don't return [], instead answer the question directly without using functions. If the given question lacks the parameters required by the function,
also point it out.

{{ function_description }}
"""
    # Built on top of the phase-1 config, so its "model" override carries over.
    replace_config = {
        **pirate_config,
        "instructions": replacement_prompt,
        "client_tools": [boiling_point_tool.get_tool_definition()],
        "tool_config": {
            "system_message_behavior": "replace",
        },
    }
    replace_agent = Agent(llama_stack_client, replace_config, client_tools=(boiling_point_tool,))
    replace_session = replace_agent.create_session(f"test-session-{uuid4()}")

    joke_output = run_turn(replace_agent, replace_session, "tell me a joke about bicycles")
    assert "bicycle" in joke_output

    # Same session: a question that should be routed through the client tool.
    tool_output = run_turn(replace_agent, replace_session, "What is the boiling point of polyjuice?")
    assert "-100" in tool_output
    assert "get_boiling_point" in tool_output
|
||||
|
||||
|
||||
@pytest.mark.parametrize("rag_tool_name", ["builtin::rag/knowledge_search", "builtin::rag"])
|
||||
def test_rag_agent(llama_stack_client, agent_config, rag_tool_name):
|
||||
urls = ["chat.rst", "llama3.rst", "memory_optimizations.rst", "lora_finetune.rst"]
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue