From 1b2e116a2ad8f6e8661b951fdbd7d9bf9ec19994 Mon Sep 17 00:00:00 2001
From: ehhuang
Date: Fri, 25 Apr 2025 13:16:16 -0700
Subject: [PATCH] fix: tool call encoded twice (#2034)

# What does this PR do?

Resets `content` to an empty string once the tool call has been built from
the parsed arguments, so the returned assistant `RawMessage` does not also
carry the tool call as text content and the call is not encoded twice.

## Test Plan

LLAMA_STACK_CONFIG=http://localhost:5002 pytest -s -v tests/integration/inference --safety-shield meta-llama/Llama-Guard-3-8B --vision-model meta-llama/Llama-4-Scout-17B-16E-Instruct --text-model meta-llama/Llama-4-Scout-17B-16E-Instruct
---
 llama_stack/models/llama/llama4/chat_format.py | 1 +
 1 file changed, 1 insertion(+)

diff --git a/llama_stack/models/llama/llama4/chat_format.py b/llama_stack/models/llama/llama4/chat_format.py
index 1debadcc5..1574eeb5e 100644
--- a/llama_stack/models/llama/llama4/chat_format.py
+++ b/llama_stack/models/llama/llama4/chat_format.py
@@ -303,6 +303,7 @@ class ChatFormat:
                     arguments_json=json.dumps(tool_arguments),
                 )
             )
+            content = ""
 
         return RawMessage(
             role="assistant",