fix(anthropic.py): fix tool calling + streaming issue

2024-05-11 20:15:36 -07:00 · 2024-05-11 20:15:36 -07:00 · a456f6bf2b
commit a456f6bf2b
parent 83beb41096
1 changed files with 30 additions and 1 deletions
--- a/litellm/llms/anthropic.py
+++ b/litellm/llms/anthropic.py
@ -165,6 +165,9 @@ class AnthropicChatCompletion(BaseLLM):
        print_verbose,
        encoding,
    ) -> CustomStreamWrapper:
+        """
+        Return stream object for tool-calling + streaming
+        """
        ## LOGGING
        logging_obj.post_call(
            input=messages,
@ -202,6 +205,18 @@ class AnthropicChatCompletion(BaseLLM):
                message=str(completion_response["error"]),
                status_code=response.status_code,
            )
+        _message = litellm.Message(
+            tool_calls=tool_calls,
+            content=text_content or None,
+        )
+        model_response.choices[0].message = _message  # type: ignore
+        model_response._hidden_params["original_response"] = completion_response[
+            "content"
+        ]  # allow user to access raw anthropic tool calling response
+
+        model_response.choices[0].finish_reason = map_finish_reason(
+            completion_response["stop_reason"]
+        )

        print_verbose("INSIDE ANTHROPIC STREAMING TOOL CALLING CONDITION BLOCK")
        # return an iterator
@ -392,13 +407,27 @@ class AnthropicChatCompletion(BaseLLM):
        litellm_params=None,
        logger_fn=None,
        headers={},
-    ) -> ModelResponse:
+    ) -> Union[ModelResponse, CustomStreamWrapper]:
        self.async_handler = AsyncHTTPHandler(
            timeout=httpx.Timeout(timeout=600.0, connect=5.0)
        )
        response = await self.async_handler.post(
            api_base, headers=headers, data=json.dumps(data)
        )
+        if stream and _is_function_call:
+            return self.process_streaming_response(
+                model=model,
+                response=response,
+                model_response=model_response,
+                stream=stream,
+                logging_obj=logging_obj,
+                api_key=api_key,
+                data=data,
+                messages=messages,
+                print_verbose=print_verbose,
+                optional_params=optional_params,
+                encoding=encoding,
+            )
        return self.process_response(
            model=model,
            response=response,