Mirror of https://github.com/BerriAI/litellm.git (synced 2025-04-26 03:04:13 +00:00)
fix(vertex_ai.py): revert system instructions - unable to find supported vertex version
This commit is contained in:
parent 45c46a84d0
commit 49b71c8118

1 changed file with 4 additions and 32 deletions
vertex_ai.py

@@ -3,7 +3,7 @@ import json
 from enum import Enum
 import requests  # type: ignore
 import time
-from typing import Callable, Optional, Union, List, Literal, Tuple
+from typing import Callable, Optional, Union, List, Literal
 from litellm.utils import ModelResponse, Usage, CustomStreamWrapper, map_finish_reason
 import litellm, uuid
 import httpx, inspect  # type: ignore
@@ -336,39 +336,14 @@ def _process_gemini_image(image_url: str) -> PartType:
         raise e


-def _extract_system_prompt_from_messages(messages: list) -> Optional[ContentType]:
-    # Separate system prompt from rest of message
-    system_prompt_indices = []
-    _parts: List[PartType] = []
-    for idx, message in enumerate(messages):
-        if message["role"] == "system":
-            _part = PartType(text=message["content"])
-            _parts.append(_part)
-            system_prompt_indices.append(idx)
-    if len(system_prompt_indices) > 0:
-        for idx in reversed(system_prompt_indices):
-            messages.pop(idx)
-    if len(_parts) > 0:
-        return ContentType(parts=_parts)
-    return None
-
-
-def _gemini_convert_messages_with_history(
-    messages: list,
-) -> Tuple[Optional[ContentType], List[ContentType]]:
+def _gemini_convert_messages_with_history(messages: list) -> List[ContentType]:
     """
     Converts given messages from OpenAI format to Gemini format

     - Parts must be iterable
     - Roles must alternate b/w 'user' and 'model' (same as anthropic -> merge consecutive roles)
     - Please ensure that function response turn comes immediately after a function call turn
-
-    Returns:
-    - Tuple[Optional[system_instructions], messages]
     """
-
-    system_instructions = _extract_system_prompt_from_messages(messages=messages)
-
     user_message_types = {"user", "system"}
     contents: List[ContentType] = []

@@ -429,7 +404,7 @@ def _gemini_convert_messages_with_history(
                 )
             )

-    return system_instructions, contents
+    return contents


 def _gemini_vision_convert_messages(messages: list):
@@ -724,9 +699,7 @@ def completion(
             print_verbose("\nMaking VertexAI Gemini Pro / Pro Vision Call")
             print_verbose(f"\nProcessing input messages = {messages}")
             tools = optional_params.pop("tools", None)
-            system_instruction, content = _gemini_convert_messages_with_history(
-                messages=messages
-            )
+            content = _gemini_convert_messages_with_history(messages=messages)
             stream = optional_params.pop("stream", False)
             if stream == True:
                 request_str += f"response = llm_model.generate_content({content}, generation_config=GenerationConfig(**{optional_params}), safety_settings={safety_settings}, stream={stream})\n"
@@ -763,7 +736,6 @@ def completion(
             ## LLM Call
             response = llm_model.generate_content(
                 contents=content,
-                system_instruction=system_instruction,
                 generation_config=optional_params,
                 safety_settings=safety_settings,
                 tools=tools,
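The docstring retained by this revert still spells out the conversion contract: parts must be iterable, roles must alternate between 'user' and 'model', and consecutive same-role messages are merged, with system messages grouped under 'user' (see user_message_types above). Below is a standalone sketch of that merging rule, using plain dicts in place of the SDK's PartType/ContentType typed dicts; the helper name and dict shapes are illustrative, not code from this commit.

    from typing import Dict, List

    def merge_consecutive_roles(messages: List[Dict[str, str]]) -> List[dict]:
        # Same grouping the helper uses: system messages are folded into user turns.
        user_message_types = {"user", "system"}
        contents: List[dict] = []
        for message in messages:
            role = "user" if message["role"] in user_message_types else "model"
            part = {"text": message["content"]}
            if contents and contents[-1]["role"] == role:
                # Merge consecutive same-role turns so roles strictly alternate.
                contents[-1]["parts"].append(part)
            else:
                contents.append({"role": role, "parts": [part]})
        return contents

    # Example: the system message and the first user message collapse into one 'user' turn.
    print(merge_consecutive_roles([
        {"role": "system", "content": "You are terse."},
        {"role": "user", "content": "Hi"},
        {"role": "assistant", "content": "Hello"},
        {"role": "user", "content": "One more thing"},
    ]))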
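If this feature is re-landed once a supported SDK version is available, note that newer releases of the Vertex AI Python SDK accept system instructions on the GenerativeModel object itself rather than as a per-request argument. A hedged sketch under that assumption; the SDK version cutoff, project id, and model name are assumptions, not part of this commit.

    # Assumes a recent google-cloud-aiplatform release; verify that
    # GenerativeModel(system_instruction=...) exists in the version litellm pins.
    import vertexai
    from vertexai.generative_models import GenerationConfig, GenerativeModel

    vertexai.init(project="my-project", location="us-central1")  # hypothetical project

    llm_model = GenerativeModel(
        "gemini-1.5-pro",  # illustrative model name
        system_instruction=["You are a terse assistant."],
    )
    response = llm_model.generate_content(
        "Summarize LiteLLM in one sentence.",
        generation_config=GenerationConfig(temperature=0.0),
    )
    print(response.text)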