(fix) OpenAI's optional messages[].name does not work with Mistral API (#6701)

* use helper for _transform_messages mistral

* add test_message_with_name to base LLMChat test

* fix linting
Ishaan Jaff 2024-11-11 18:03:41 -08:00 committed by GitHub
parent c3bc9e6b12
commit 9d20c19e0c
4 changed files with 100 additions and 38 deletions
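
Minimal repro of the fixed behavior (illustrative, not part of the diff; assumes MISTRAL_API_KEY is set): before this commit, the OpenAI-style optional `name` field on a user message was forwarded as-is and the Mistral API rejected the request; after it, `name` is dropped before the request is sent.

    import litellm  # requires MISTRAL_API_KEY in the environment

    # Previously failed against Mistral because of the extra `name` field;
    # with this commit the field is stripped during message transformation.
    response = litellm.completion(
        model="mistral/mistral-small-latest",
        messages=[{"role": "user", "content": "Hello", "name": "test_name"}],
    )
    print(response.choices[0].message.content)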


@@ -10,6 +10,7 @@ import types
 from typing import List, Literal, Optional, Tuple, Union

 from litellm.secret_managers.main import get_secret_str
+from litellm.types.llms.openai import AllMessageValues


 class MistralConfig:
@@ -148,3 +149,59 @@ class MistralConfig:
             or get_secret_str("MISTRAL_API_KEY")
         )
         return api_base, dynamic_api_key
+
+    @classmethod
+    def _transform_messages(cls, messages: List[AllMessageValues]):
+        """
+        - handles scenario where content is list and not string
+        - content list is just text, and no images
+        - if image passed in, then just return as is (user-intended)
+        - if `name` is passed, then drop it for mistral API: https://github.com/BerriAI/litellm/issues/6696
+
+        Motivation: mistral api doesn't support content as a list
+        """
+        new_messages = []
+        for m in messages:
+            special_keys = ["role", "content", "tool_calls", "function_call"]
+            extra_args = {}
+            if isinstance(m, dict):
+                for k, v in m.items():
+                    if k not in special_keys:
+                        extra_args[k] = v
+            texts = ""
+            _content = m.get("content")
+            if _content is not None and isinstance(_content, list):
+                for c in _content:
+                    _text: Optional[str] = c.get("text")
+                    if c["type"] == "image_url":
+                        return messages
+                    elif c["type"] == "text" and isinstance(_text, str):
+                        texts += _text
+            elif _content is not None and isinstance(_content, str):
+                texts = _content
+
+            new_m = {"role": m["role"], "content": texts, **extra_args}
+
+            if m.get("tool_calls"):
+                new_m["tool_calls"] = m.get("tool_calls")
+
+            new_m = cls._handle_name_in_message(new_m)
+
+            new_messages.append(new_m)
+        return new_messages
+
+    @classmethod
+    def _handle_name_in_message(cls, message: dict) -> dict:
+        """
+        Mistral API only supports `name` in tool messages
+        If role == tool, then we keep `name`
+        Otherwise, we drop `name`
+        """
+        if message.get("name") is not None:
+            if message["role"] == "tool":
+                message["name"] = message.get("name")
+            else:
+                message.pop("name", None)
+
+        return message
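
Illustrative use of the two class methods above (a sketch, not part of the diff; `litellm.MistralConfig` is the same path the updated `prompt_factory` below uses): `name` is stripped from non-tool messages and preserved on tool messages.

    import litellm

    messages = [
        {"role": "user", "content": "Hello", "name": "test_name"},
        {"role": "tool", "content": "42", "tool_call_id": "call_1", "name": "get_answer"},
    ]
    print(litellm.MistralConfig._transform_messages(messages))
    # [{'role': 'user', 'content': 'Hello'},
    #  {'role': 'tool', 'content': '42', 'tool_call_id': 'call_1', 'name': 'get_answer'}]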


@@ -259,43 +259,6 @@ def mistral_instruct_pt(messages):
     return prompt


-def mistral_api_pt(messages):
-    """
-    - handles scenario where content is list and not string
-    - content list is just text, and no images
-    - if image passed in, then just return as is (user-intended)
-
-    Motivation: mistral api doesn't support content as a list
-    """
-    new_messages = []
-    for m in messages:
-        special_keys = ["role", "content", "tool_calls", "function_call"]
-        extra_args = {}
-        if isinstance(m, dict):
-            for k, v in m.items():
-                if k not in special_keys:
-                    extra_args[k] = v
-        texts = ""
-        if m.get("content", None) is not None and isinstance(m["content"], list):
-            for c in m["content"]:
-                if c["type"] == "image_url":
-                    return messages
-                elif c["type"] == "text" and isinstance(c["text"], str):
-                    texts += c["text"]
-        elif m.get("content", None) is not None and isinstance(m["content"], str):
-            texts = m["content"]
-
-        new_m = {"role": m["role"], "content": texts, **extra_args}
-
-        if new_m["role"] == "tool" and m.get("name"):
-            new_m["name"] = m["name"]
-
-        if m.get("tool_calls"):
-            new_m["tool_calls"] = m["tool_calls"]
-
-        new_messages.append(new_m)
-    return new_messages
-

 # Falcon prompt template - from https://github.com/lm-sys/FastChat/blob/main/fastchat/conversation.py#L110
 def falcon_instruct_pt(messages):
     prompt = ""
@@ -2853,7 +2816,7 @@ def prompt_factory(
         else:
             return gemini_text_image_pt(messages=messages)
     elif custom_llm_provider == "mistral":
-        return mistral_api_pt(messages=messages)
+        return litellm.MistralConfig._transform_messages(messages=messages)
    elif custom_llm_provider == "bedrock":
        if "amazon.titan-text" in model:
            return amazon_titan_pt(messages=messages)
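
With the routing change above, both content-handling behaviours documented in the deleted `mistral_api_pt` docstring now live in `MistralConfig._transform_messages`. A sketch of each (illustrative, not from the diff): text-only content lists are flattened into a single string, while any `image_url` part short-circuits and returns the original messages untouched.

    import litellm

    # A list of text parts is flattened into one string.
    text_only = [
        {"role": "user", "content": [{"type": "text", "text": "Hi "}, {"type": "text", "text": "there"}]}
    ]
    print(litellm.MistralConfig._transform_messages(text_only))
    # [{'role': 'user', 'content': 'Hi there'}]

    # Any image part returns the original message list unchanged.
    with_image = [
        {
            "role": "user",
            "content": [
                {"type": "text", "text": "Describe this"},
                {"type": "image_url", "image_url": {"url": "https://example.com/cat.png"}},
            ],
        }
    ]
    assert litellm.MistralConfig._transform_messages(with_image) is with_image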


@@ -45,6 +45,14 @@ class BaseLLMChatTest(ABC):
         )
         assert response is not None

+    def test_message_with_name(self):
+        base_completion_call_args = self.get_base_completion_call_args()
+        messages = [
+            {"role": "user", "content": "Hello", "name": "test_name"},
+        ]
+        response = litellm.completion(**base_completion_call_args, messages=messages)
+        assert response is not None
+
     @pytest.fixture
     def pdf_messages(self):
         import base64


@@ -0,0 +1,34 @@
+import asyncio
+import os
+import sys
+import traceback
+
+from dotenv import load_dotenv
+
+import litellm.types
+import litellm.types.utils
+from litellm.llms.anthropic.chat import ModelResponseIterator
+
+load_dotenv()
+import io
+import os
+
+sys.path.insert(
+    0, os.path.abspath("../..")
+)  # Adds the parent directory to the system path
+from typing import Optional
+from unittest.mock import MagicMock, patch
+
+import pytest
+
+import litellm
+from litellm.llms.anthropic.common_utils import process_anthropic_headers
+from httpx import Headers
+from base_llm_unit_tests import BaseLLMChatTest
+
+
+class TestMistralCompletion(BaseLLMChatTest):
+    def get_base_completion_call_args(self) -> dict:
+        litellm.set_verbose = True
+        return {"model": "mistral/mistral-small-latest"}