(feat) support timeout on bedrock

2025-04-26 19:24:27 +00:00 · 2024-02-09 17:42:17 -08:00 · 2024-02-09 17:42:17 -08:00 · cd9005d6e6
commit cd9005d6e6
parent 43232012d7
2 changed files with 57 additions and 2 deletions
--- a/litellm/router.py
+++ b/litellm/router.py
@ -389,7 +389,7 @@ class Router:
            model_name = data["model"]
            for k, v in self.default_litellm_params.items():
                if (
-                    k not in kwargs
+                    k not in kwargs and v is not None
                ):  # prioritize model-specific params > default router params
                    kwargs[k] = v
                elif k == "metadata":
@ -409,13 +409,24 @@ class Router:
            else:
                model_client = potential_model_client
            self.total_calls[model_name] += 1
            timeout = (
                data.get(
                    "timeout", None
                )  # timeout set on litellm_params for this deployment
                or self.timeout  # timeout set on router
                or kwargs.get(
                    "timeout", None
                )  # this uses default_litellm_params when nothing is set
            )
            response = await litellm.acompletion(
                **{
                    **data,
                    "messages": messages,
                    "caching": self.cache_responses,
                    "client": model_client,
-                    "timeout": self.timeout,
+                    "timeout": timeout,
                    **kwargs,
                }
            )
--- a/litellm/tests/test_router_timeout.py
+++ b/litellm/tests/test_router_timeout.py
@ -85,3 +85,47 @@ def test_router_timeouts():
        print("Response:", response)
        print("********** TOKENS USED SO FAR = ", total_tokens_used)
@pytest.mark.asyncio
 async def test_router_timeouts_bedrock():
    import openai
    # Model list for OpenAI and Anthropic models
    model_list = [
        {
            "model_name": "bedrock",
            "litellm_params": {
                "model": "bedrock/anthropic.claude-instant-v1",
                "timeout": 0.001,
            },
            "tpm": 80000,
        },
    ]
    # Configure router
    router = Router(
        model_list=model_list,
        routing_strategy="usage-based-routing",
        debug_level="DEBUG",
        set_verbose=True,
    )
    litellm.set_verbose = True
    try:
        response = await router.acompletion(
            model="bedrock",
            messages=[{"role": "user", "content": "hello, who are u"}],
        )
        print(response)
        pytest.fail("Did not raise error `openai.APITimeoutError`")
    except openai.APITimeoutError as e:
        print(
            "Passed: Raised correct exception. Got openai.APITimeoutError\nGood Job", e
        )
        print(type(e))
        pass
    except Exception as e:
        pytest.fail(
            f"Did not raise error `openai.APITimeoutError`. Instead raised error type: {type(e)}, Error: {e}"
        )