Mirror of https://github.com/meta-llama/llama-stack.git (synced 2025-12-08 19:10:56 +00:00)
Fix fireworks and update the test

Don't look for eom_id / eot_id, sadly, since providers don't return the last token
commit dba7caf1d0
parent bbd3a02615

4 changed files with 37 additions and 37 deletions
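For context on the commit message: the tests below call a helper named get_expected_stop_reason, which encodes the eom_id / eot_id distinction that providers fail to surface. A minimal sketch of what such a helper plausibly looks like, assuming the StopReason enum from llama_models (the import path is an assumption):

from llama_models.llama3.api.datatypes import StopReason  # assumed import path


def get_expected_stop_reason(model: str) -> StopReason:
    # Llama 3.1 models emit <|eom_id|> after a tool call, which maps to
    # end_of_message; other models end the turn with <|eot_id|> (end_of_turn).
    if "Llama3.1" in model:
        return StopReason.end_of_message
    return StopReason.end_of_turn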
@@ -13,3 +13,13 @@ providers:
     config:
       host: localhost
       port: 7002
+  - provider_id: test-together
+    provider_type: remote::together
+    config: {}
+
+# if a provider needs private keys from the client, they use the
+# "get_request_provider_data" function (see distribution/request_headers.py)
+# this is a place to provide such data.
+provider_data:
+  "test-together":
+    together_api_key: 0xdeadbeefputrealapikeyhere
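The provider_data block above is what get_request_provider_data (see distribution/request_headers.py) hands back to a provider at request time; clients can supply the same shape of data per request. A hedged sketch of how a client might send it, assuming the server reads a JSON payload from an X-LlamaStack-ProviderData header and assuming an illustrative endpoint path and model name:

import json

import requests

# Assumptions: the header name, endpoint path, and model name are
# illustrative; the server-side parsing lives in distribution/request_headers.py.
provider_data = {"together_api_key": "0xdeadbeefputrealapikeyhere"}
response = requests.post(
    "http://localhost:5000/inference/chat_completion",
    headers={"X-LlamaStack-ProviderData": json.dumps(provider_data)},
    json={
        "model": "Llama3.1-8B-Instruct",
        "messages": [{"role": "user", "content": "Hello"}],
    },
)
print(response.status_code)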
@@ -222,8 +222,9 @@ async def test_chat_completion_with_tool_calling(

     message = response[0].completion_message

-    stop_reason = get_expected_stop_reason(inference_settings["common_params"]["model"])
-    assert message.stop_reason == stop_reason
+    # This is not supported in most providers :/ they don't return eom_id / eot_id
+    # stop_reason = get_expected_stop_reason(inference_settings["common_params"]["model"])
+    # assert message.stop_reason == stop_reason
     assert message.tool_calls is not None
     assert len(message.tool_calls) > 0
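The new comment is the heart of the change: remote providers report a generic OpenAI-style finish reason rather than the raw <|eom_id|> / <|eot_id|> token, so an adapter can only map it coarsely. A sketch of the kind of mapping this forces (the function name is hypothetical; the finish-reason strings are the usual "stop" / "length" values):

from typing import Optional

from llama_models.llama3.api.datatypes import StopReason  # assumed import path


def map_finish_reason(finish_reason: Optional[str]) -> StopReason:
    # "length" means the token budget ran out. Anything else (typically
    # "stop") only says that some stop token fired; the provider does not
    # reveal whether it was <|eom_id|> or <|eot_id|>, so the distinction
    # between end_of_message and end_of_turn is lost at this point.
    if finish_reason == "length":
        return StopReason.out_of_tokens
    return StopReason.end_of_turn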
@@ -266,10 +267,12 @@ async def test_chat_completion_with_tool_calling_streaming(
     assert len(grouped[ChatCompletionResponseEventType.complete]) == 1

     end = grouped[ChatCompletionResponseEventType.complete][0]
-    expected_stop_reason = get_expected_stop_reason(
-        inference_settings["common_params"]["model"]
-    )
-    assert end.event.stop_reason == expected_stop_reason
+
+    # This is not supported in most providers :/ they don't return eom_id / eot_id
+    # expected_stop_reason = get_expected_stop_reason(
+    #     inference_settings["common_params"]["model"]
+    # )
+    # assert end.event.stop_reason == expected_stop_reason

     model = inference_settings["common_params"]["model"]
     if "Llama3.1" in model:
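Both streaming hunks index a grouped view of the response chunks. A minimal sketch of how such a grouping might be built, assuming each chunk exposes event.event_type (the helper name is hypothetical; the real test may group differently):

from collections import defaultdict


def group_chunks(chunks):
    # Bucket streamed chunks by event type (start / progress / complete) so a
    # test can index them like grouped[ChatCompletionResponseEventType.complete].
    grouped = defaultdict(list)
    for chunk in chunks:
        grouped[chunk.event.event_type].append(chunk)
    return grouped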
@@ -281,7 +284,7 @@ async def test_chat_completion_with_tool_calling_streaming(
     assert first.event.delta.parse_status == ToolCallParseStatus.started

     last = grouped[ChatCompletionResponseEventType.progress][-1]
-    assert last.event.stop_reason == expected_stop_reason
+    # assert last.event.stop_reason == expected_stop_reason
     assert last.event.delta.parse_status == ToolCallParseStatus.success
     assert isinstance(last.event.delta.content, ToolCall)