forked from phoenix/litellm-mirror
fix(test_amazing_vertex_completion.py): handle vertex ai rate limit error
This commit is contained in:
parent
3dbb547af0
commit
f7537f2cdf
1 changed file with 44 additions and 12 deletions
|
@@ -487,6 +487,35 @@ def test_gemini_pro_vision_base64():
|
||||||
|
|
||||||
|
|
||||||
def test_gemini_pro_function_calling():
    """Smoke-test Vertex AI (gemini-pro) tool/function calling via litellm.

    Sends a weather question together with a single OpenAI-style tool schema
    and expects the model to answer with exactly one tool call
    (``get_current_weather``) and no plain-text content.

    Per this commit's intent, Vertex AI rate-limit errors are swallowed so
    quota exhaustion does not flake CI; any other exception still fails the
    test.
    """
    try:
        # Loads the service-account credentials litellm needs for Vertex AI.
        load_vertex_ai_credentials()
        tools = [
            {
                "type": "function",
                "function": {
                    "name": "get_current_weather",
                    "description": "Get the current weather in a given location",
                    "parameters": {
                        "type": "object",
                        "properties": {
                            "location": {
                                "type": "string",
                                "description": "The city and state, e.g. San Francisco, CA",
                            },
                            "unit": {"type": "string", "enum": ["celsius", "fahrenheit"]},
                        },
                        "required": ["location"],
                    },
                },
            }
        ]
        messages = [
            {"role": "user", "content": "What's the weather like in Boston today?"}
        ]
        completion = litellm.completion(
            model="gemini-pro", messages=messages, tools=tools, tool_choice="auto"
        )
        print(f"completion: {completion}")
        # A function-calling response carries tool_calls instead of text.
        assert completion.choices[0].message.content is None
        assert len(completion.choices[0].message.tool_calls) == 1
    except litellm.RateLimitError:
        # Vertex AI quota exhaustion is expected occasionally; not a failure.
        pass
|
||||||
|
@@ -557,6 +586,7 @@ def test_gemini_pro_function_calling_streaming():
|
||||||
}
|
}
|
||||||
]
|
]
|
||||||
messages = [{"role": "user", "content": "What's the weather like in Boston today?"}]
|
messages = [{"role": "user", "content": "What's the weather like in Boston today?"}]
|
||||||
|
try:
|
||||||
completion = litellm.completion(
|
completion = litellm.completion(
|
||||||
model="gemini-pro",
|
model="gemini-pro",
|
||||||
messages=messages,
|
messages=messages,
|
||||||
|
@@ -569,6 +599,8 @@ def test_gemini_pro_function_calling_streaming():
|
||||||
# assert len(completion.choices[0].message.tool_calls) == 1
|
# assert len(completion.choices[0].message.tool_calls) == 1
|
||||||
for chunk in completion:
|
for chunk in completion:
|
||||||
print(f"chunk: {chunk}")
|
print(f"chunk: {chunk}")
|
||||||
|
except litellm.RateLimitError as e:
|
||||||
|
pass
|
||||||
|
|
||||||
|
|
||||||
@pytest.mark.asyncio
|
@pytest.mark.asyncio
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue