Merge pull request #5232 from Penagwin/fix_anthropic_tool_streaming_index

Fixes the `tool_use` indexes not being correctly mapped
This commit is contained in:
Krish Dholakia 2024-08-17 14:33:50 -07:00 committed by GitHub
commit be37310e94
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
2 changed files with 75 additions and 4 deletions

View file

@@ -1122,6 +1122,7 @@ class ModelResponseIterator:
self.streaming_response = streaming_response
self.response_iterator = self.streaming_response
self.content_blocks: List[ContentBlockDelta] = []
self.tool_index = -1
def check_empty_tool_call_args(self) -> bool:
"""
@@ -1171,7 +1172,7 @@ class ModelResponseIterator:
"name": None,
"arguments": content_block["delta"]["partial_json"],
},
"index": content_block["index"],
"index": self.tool_index,
}
elif type_chunk == "content_block_start":
"""
@@ -1183,6 +1184,7 @@ class ModelResponseIterator:
if content_block_start["content_block"]["type"] == "text":
text = content_block_start["content_block"]["text"]
elif content_block_start["content_block"]["type"] == "tool_use":
self.tool_index += 1
tool_use = {
"id": content_block_start["content_block"]["id"],
"type": "function",
@@ -1190,7 +1192,7 @@ class ModelResponseIterator:
"name": content_block_start["content_block"]["name"],
"arguments": "",
},
"index": content_block_start["index"],
"index": self.tool_index,
}
elif type_chunk == "content_block_stop":
content_block_stop = ContentBlockStop(**chunk) # type: ignore
@@ -1204,7 +1206,7 @@ class ModelResponseIterator:
"name": None,
"arguments": "{}",
},
"index": content_block_stop["index"],
"index": self.tool_index,
}
elif type_chunk == "message_delta":
"""

View file

@@ -10,6 +10,7 @@ from dotenv import load_dotenv
import litellm.types
import litellm.types.utils
from litellm.llms.anthropic import ModelResponseIterator
load_dotenv()
import io
@@ -150,6 +151,74 @@ def test_anthropic_completion_e2e(stream):
assert message_stop_received is True
# Synthetic Anthropic streaming event fixture: a text content block at raw
# index 0, followed by two tool_use blocks at raw indexes 1 and 2. Used to
# verify that chunk_parser remaps tool_use indexes so the first tool starts
# at 0 (OpenAI convention) rather than at the raw Anthropic block index.
anthropic_chunk_list = [
    {"type": "content_block_start", "index": 0, "content_block": {"type": "text", "text": ""}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": "To"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " answer"}},
    {"type": "content_block_delta", "index": 0,
     "delta": {"type": "text_delta", "text": " your question about the weather"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " in Boston and Los"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " Angeles today, I'll"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " need to"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " use"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " the"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " get_current_weather"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " function"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " for"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " both"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " cities"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": ". Let"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " me fetch"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " that"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " information"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " for"}},
    {"type": "content_block_delta", "index": 0, "delta": {"type": "text_delta", "text": " you."}},
    {"type": "content_block_stop", "index": 0},
    # First tool_use block — raw Anthropic index 1, expected remapped index 0.
    {"type": "content_block_start", "index": 1,
     "content_block": {"type": "tool_use", "id": "toolu_12345", "name": "get_current_weather", "input": {}}},
    {"type": "content_block_delta", "index": 1, "delta": {"type": "input_json_delta", "partial_json": ""}},
    {"type": "content_block_delta", "index": 1, "delta": {"type": "input_json_delta", "partial_json": "{\"locat"}},
    {"type": "content_block_delta", "index": 1, "delta": {"type": "input_json_delta", "partial_json": "ion\": \"Bos"}},
    {"type": "content_block_delta", "index": 1, "delta": {"type": "input_json_delta", "partial_json": "ton, MA\"}"}},
    {"type": "content_block_stop", "index": 1},
    # Second tool_use block — raw Anthropic index 2, expected remapped index 1.
    {"type": "content_block_start", "index": 2,
     "content_block": {"type": "tool_use", "id": "toolu_023423423", "name": "get_current_weather", "input": {}}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": ""}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "{\"l"}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "oca"}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "tio"}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "n\": \"Lo"}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "s Angel"}},
    {"type": "content_block_delta", "index": 2, "delta": {"type": "input_json_delta", "partial_json": "es, CA\"}"}},
    {"type": "content_block_stop", "index": 2},
    {"type": "message_delta", "delta": {"stop_reason": "tool_use", "stop_sequence": None},
     "usage": {"output_tokens": 137}},
    {"type": "message_stop"}
]
def test_anthropic_tool_streaming():
    """
    Verify tool_use index remapping in the Anthropic stream parser.

    OpenAI numbers tool_use entries from 0 for the first tool, regardless of
    any preceding text blocks. Anthropic's raw content-block indexes count the
    text block too, so its first tool often arrives with index 1. The parser
    must translate the raw index to the OpenAI-style one.
    """
    litellm.set_verbose = True
    response_iter = ModelResponseIterator([], False)
    # The first tool block should map to 0; start one below and increment on
    # each new block so the counter is easy to advance in the loop.
    expected_index = -1
    for raw_chunk in anthropic_chunk_list:
        parsed = response_iter.chunk_parser(raw_chunk)
        tool_use = parsed.get('tool_use')
        if not tool_use:
            continue
        # Only a content_block_start carries an id — that marks a new tool.
        if tool_use.get('id') is not None:
            expected_index += 1
        assert tool_use['index'] == expected_index
@pytest.mark.asyncio
async def test_anthropic_router_completion_e2e():
litellm.set_verbose = True
@@ -275,4 +344,4 @@ def test_anthropic_tool_calling_translation():
print(translated_params["messages"])
assert len(translated_params["messages"]) > 0
assert translated_params["messages"][0]["role"] == "user"
assert translated_params["messages"][0]["role"] == "user"