mirror of https://github.com/meta-llama/llama-stack.git
synced 2025-12-13 04:22:35 +00:00

commit b563835a82 (parent 571276f88c)
update test

5 changed files with 5490 additions and 29 deletions
@@ -0,0 +1,203 @@
{
  "test_id": "tests/integration/tool_runtime/test_mcp.py::test_mcp_invocation[txt=ollama/llama3.2:3b-instruct-fp16]",
  "request": {
    "method": "POST",
    "url": "http://0.0.0.0:11434/v1/v1/chat/completions",
    "headers": {},
    "body": {
      "model": "llama3.2:3b-instruct-fp16",
      "messages": [
        {
          "role": "system",
          "content": "You are a helpful assistant."
        },
        {
          "role": "user",
          "content": [
            {
              "type": "text",
              "text": "Say hi to the world. Use tools to do so."
            }
          ]
        },
        {
          "role": "assistant",
          "content": "",
          "tool_calls": [
            {
              "index": 0,
              "id": "call_c1tlwvxc",
              "type": "function",
              "function": {
                "name": "greet_everyone",
                "arguments": "{\"url\":\"world\"}"
              }
            }
          ]
        },
        {
          "role": "tool",
          "tool_call_id": "call_c1tlwvxc",
          "content": [
            {
              "type": "text",
              "text": "Hello, world!"
            }
          ]
        },
        {
          "role": "assistant",
          "content": "I apologize, it seems like my previous response from the tool did not translate to a clear greeting.\n\nLet me try again using a different approach. I can use a text-to-speech conversion tool to say hello in various languages:\n\n\"Hello\"\n\n(or)\n\n\"Pong\"\n\n(in multiple languages such as Spanish: \"Hola\", French: \"Bonjour\", Chinese:, Japanese:, Korean:, or many others)"
        },
        {
          "role": "user",
          "content": [
            {
              "type": "text",
              "text": "What is the boiling point of polyjuice? Use tools to answer."
            }
          ]
        }
      ],
      "stream": true,
      "stream_options": {
        "include_usage": true
      },
      "tools": [
        {
          "type": "function",
          "function": {
            "name": "greet_everyone",
            "parameters": {
              "properties": {
                "url": {
                  "title": "Url",
                  "type": "string"
                }
              },
              "required": [
                "url"
              ],
              "title": "greet_everyoneArguments",
              "type": "object"
            }
          }
        },
        {
          "type": "function",
          "function": {
            "name": "get_boiling_point",
            "description": "\n    Returns the boiling point of a liquid in Celsius or Fahrenheit.\n\n    :param liquid_name: The name of the liquid\n    :param celsius: Whether to return the boiling point in Celsius\n    :return: The boiling point of the liquid in Celcius or Fahrenheit\n    ",
            "parameters": {
              "properties": {
                "liquid_name": {
                  "title": "Liquid Name",
                  "type": "string"
                },
                "celsius": {
                  "default": true,
                  "title": "Celsius",
                  "type": "boolean"
                }
              },
              "required": [
                "liquid_name"
              ],
              "title": "get_boiling_pointArguments",
              "type": "object"
            }
          }
        }
      ]
    },
    "endpoint": "/v1/chat/completions",
    "model": "llama3.2:3b-instruct-fp16"
  },
  "response": {
    "body": [
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
          "id": "rec-0b29d8fc2fee",
          "choices": [
            {
              "delta": {
                "content": "",
                "function_call": null,
                "refusal": null,
                "role": "assistant",
                "tool_calls": [
                  {
                    "index": 0,
                    "id": "call_h8atvnz3",
                    "function": {
                      "arguments": "{\"celsius\":\"true\",\"liquid_name\":\"polyjuice\"}",
                      "name": "get_boiling_point"
                    },
                    "type": "function"
                  }
                ]
              },
              "finish_reason": null,
              "index": 0,
              "logprobs": null
            }
          ],
          "created": 0,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
          "system_fingerprint": "fp_ollama",
          "usage": null
        }
      },
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
          "id": "rec-0b29d8fc2fee",
          "choices": [
            {
              "delta": {
                "content": "",
                "function_call": null,
                "refusal": null,
                "role": "assistant",
                "tool_calls": null
              },
              "finish_reason": "tool_calls",
              "index": 0,
              "logprobs": null
            }
          ],
          "created": 0,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
          "system_fingerprint": "fp_ollama",
          "usage": null
        }
      },
      {
        "__type__": "openai.types.chat.chat_completion_chunk.ChatCompletionChunk",
        "__data__": {
          "id": "rec-0b29d8fc2fee",
          "choices": [],
          "created": 0,
          "model": "llama3.2:3b-instruct-fp16",
          "object": "chat.completion.chunk",
          "service_tier": null,
          "system_fingerprint": "fp_ollama",
          "usage": {
            "completion_tokens": 29,
            "prompt_tokens": 414,
            "total_tokens": 443,
            "completion_tokens_details": null,
            "prompt_tokens_details": null
          }
        }
      }
    ],
    "is_streaming": true
  },
  "id_normalization_mapping": {}
}
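The recording above captures one streamed, tool-calling chat completion against Ollama's OpenAI-compatible endpoint (the doubled /v1 in the recorded URL reflects a client base URL of .../v1 plus the /v1/chat/completions path). As a minimal sketch of an equivalent request, assuming the official openai Python client and a local Ollama server, and showing only the get_boiling_point tool from the recorded schema (client setup and chunk handling are illustrative only, not part of this commit):

# Sketch only: replay the request captured in the recording above.
from openai import OpenAI

# Base URL and model are taken from the recording; the API key is a placeholder
# because Ollama's OpenAI-compatible endpoint does not require one.
client = OpenAI(base_url="http://0.0.0.0:11434/v1", api_key="none")

tools = [
    {
        "type": "function",
        "function": {
            "name": "get_boiling_point",
            "description": "Returns the boiling point of a liquid in Celsius or Fahrenheit.",
            "parameters": {
                "type": "object",
                "properties": {
                    "liquid_name": {"title": "Liquid Name", "type": "string"},
                    "celsius": {"default": True, "title": "Celsius", "type": "boolean"},
                },
                "required": ["liquid_name"],
            },
        },
    }
]

stream = client.chat.completions.create(
    model="llama3.2:3b-instruct-fp16",
    messages=[
        {"role": "system", "content": "You are a helpful assistant."},
        {"role": "user", "content": "What is the boiling point of polyjuice? Use tools to answer."},
    ],
    tools=tools,
    stream=True,
    stream_options={"include_usage": True},
)

# Collect streamed tool-call deltas; the final usage-only chunk has no choices.
for chunk in stream:
    if chunk.choices:
        for tool_call in chunk.choices[0].delta.tool_calls or []:
            print(tool_call.function.name, tool_call.function.arguments)

In the recorded response, the first chunk carries the get_boiling_point call with its JSON arguments, the second closes the turn with finish_reason "tool_calls", and the last chunk reports only token usage (29 completion tokens, 414 prompt tokens).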
File diff suppressed because it is too large
File diff suppressed because it is too large
@@ -91,7 +91,7 @@
         "tool_calls": [
           {
             "index": 0,
-            "id": "call_j1l3nnv3",
+            "id": "call_c1tlwvxc",
             "function": {
               "arguments": "{\"url\":\"world\"}",
               "name": "greet_everyone"
@@ -132,31 +132,3 @@ def test_mcp_invocation(llama_stack_client, text_model_id, mcp_server):
     assert tool_events[-1].result.tool_calls[0].tool_name == "greet_everyone"
 
     assert "hello" in final_response.output_text.lower()
-
-    # when streaming, we currently don't check auth headers upfront and fail the request
-    # early. but we should at least be generating a 401 later in the process.
-    response_stream = agent.create_turn(
-        session_id=session_id,
-        messages=[
-            {
-                "type": "message",
-                "role": "user",
-                "content": [
-                    {
-                        "type": "input_text",
-                        "text": "What is the boiling point of polyjuice? Use tools to answer.",
-                    }
-                ],
-            }
-        ],
-        stream=True,
-    )
-    if isinstance(llama_stack_client, LlamaStackAsLibraryClient):
-        with pytest.raises(AuthenticationRequiredError):
-            for _ in response_stream:
-                pass
-    else:
-        error_chunks = [chunk for chunk in response_stream if "error" in chunk.model_dump()]
-        assert len(error_chunks) == 1
-        chunk = error_chunks[0].model_dump()
-        assert "Unauthorized" in chunk["error"]["message"]