test(verification): add streaming tool calling test (#1933)

# What does this PR do? ## Test Plan --- [//]: # (BEGIN SAPLING FOOTER) Stack created with [Sapling](https://sapling-scm.com). Best reviewed with [ReviewStack](https://reviewstack.dev/meta-llama/llama-stack/pull/1933). * #1934 * __->__ #1933
2025-04-10 16:58:06 -07:00 · 2025-04-10 16:58:06 -07:00 · a4cc4b7e31
commit a4cc4b7e31
parent 49955a06b1
1 changed files with 55 additions and 0 deletions
--- a/tests/verifications/openai_api/test_chat_completion.py
+++ b/tests/verifications/openai_api/test_chat_completion.py
@ -4,6 +4,7 @@
 # This source code is licensed under the terms described in the LICENSE file in
 # the root directory of this source tree.
 import json
 import re
 from typing import Any
@ -225,6 +226,60 @@ def test_chat_non_streaming_tool_calling(request, openai_client, model, provider
    # TODO: add detailed type validation
@pytest.mark.parametrize(
    "case",
    chat_completion_test_cases["test_tool_calling"]["test_params"]["case"],
    ids=case_id_generator,
 )
 def test_chat_streaming_tool_calling(request, openai_client, model, provider, verification_config, case):
    test_name_base = get_base_test_name(request)
    if should_skip_test(verification_config, provider, model, test_name_base):
        pytest.skip(f"Skipping {test_name_base} for model {model} on provider {provider} based on config.")
    stream = openai_client.chat.completions.create(
        model=model,
        messages=case["input"]["messages"],
        tools=case["input"]["tools"],
        stream=True,
    )
    # Accumulate partial tool_calls here
    tool_calls_buffer = {}
    current_id = None
    # Process streaming chunks
    for chunk in stream:
        choice = chunk.choices[0]
        delta = choice.delta
        if delta.tool_calls is None:
            continue
        for tool_call_delta in delta.tool_calls:
            if tool_call_delta.id:
                current_id = tool_call_delta.id
            call_id = current_id
            func_delta = tool_call_delta.function
            if call_id not in tool_calls_buffer:
                tool_calls_buffer[call_id] = {
                    "id": call_id,
                    "type": tool_call_delta.type,
                    "name": func_delta.name,
                    "arguments": "",
                }
            if func_delta.arguments:
                tool_calls_buffer[call_id]["arguments"] += func_delta.arguments
    assert len(tool_calls_buffer) == 1
    for call in tool_calls_buffer.values():
        assert len(call["id"]) > 0
        assert call["name"] == "get_weather"
        args_dict = json.loads(call["arguments"])
        assert "san francisco" in args_dict["location"].lower()
 # --- Helper functions (structured output validation) ---