fix(router.py): unify retry timeout logic across sync + async function_with_retries

2025-04-27 11:43:54 +00:00 · 2024-04-30 15:23:19 -07:00 · 2024-04-30 15:23:19 -07:00 · 87ff26ff27
commit 87ff26ff27
parent 285a3733a9
2 changed files with 119 additions and 65 deletions
--- a/litellm/tests/test_router.py
+++ b/litellm/tests/test_router.py
@@ -104,6 +104,42 @@ def test_router_timeout_init(timeout, ssl_verify):
        )


+@pytest.mark.parametrize("sync_mode", [False, True])  # one run per mode: False -> acompletion, True -> completion
+@pytest.mark.asyncio
+async def test_router_retries(sync_mode):
+    """
+    - make sure retries work as expected: sends one chat completion through a two-deployment Router (num_retries=2)
+    """
+    model_list = [
+        {
+            "model_name": "gpt-3.5-turbo",
+            "litellm_params": {"model": "gpt-3.5-turbo", "api_key": "bad-key"},  # presumably an invalid key so this deployment fails - TODO confirm
+        },
+        {
+            "model_name": "gpt-3.5-turbo",  # same model_name as the entry above
+            "litellm_params": {
+                "model": "azure/chatgpt-v-2",
+                "api_key": os.getenv("AZURE_API_KEY"),  # Azure settings are read from the environment
+                "api_base": os.getenv("AZURE_API_BASE"),
+                "api_version": os.getenv("AZURE_API_VERSION"),
+            },
+        },
+    ]
+
+    router = Router(model_list=model_list, num_retries=2)  # retry count handed to the Router
+
+    if sync_mode:
+        router.completion(  # sync entry point, not awaited; NOTE(review): result is discarded, nothing is asserted
+            model="gpt-3.5-turbo",
+            messages=[{"role": "user", "content": "Hey, how's it going?"}],
+        )
+    else:
+        await router.acompletion(  # async entry point; NOTE(review): result is discarded, test passes if nothing raises
+            model="gpt-3.5-turbo",
+            messages=[{"role": "user", "content": "Hey, how's it going?"}],
+        )
+
+
@pytest.mark.parametrize(
    "mistral_api_base",
    [