Merge pull request #3962 from BerriAI/litellm_return_num_rets_max_exceptions

[Feat] return `num_retries` and `max_retries` in exceptions
2025-04-25 10:44:24 +00:00 · 2024-06-01 17:48:38 -07:00 · 2024-06-01 17:48:38 -07:00 · fb49d036fb
commit fb49d036fb
parent edf296fb5b d4378143f1
4 changed files with 355 additions and 9 deletions
--- a/litellm/router.py
+++ b/litellm/router.py
@ -2059,6 +2059,8 @@ class Router:
            response = await original_function(*args, **kwargs)
            return response
        except Exception as e:
+            num_retries = None
+            current_attempt = None
            original_exception = e
            """
            Retry Logic
@ -2128,11 +2130,10 @@ class Router:
                    )
                    await asyncio.sleep(_timeout)

-            try:
-                cooldown_deployments = await self._async_get_cooldown_deployments()
-                original_exception.message += f"\nNumber Retries = {current_attempt + 1}, Max Retries={num_retries}\nCooldown Deployments={cooldown_deployments}"
-            except:
-                pass
+            if type(original_exception) in litellm.LITELLM_EXCEPTION_TYPES:
+                original_exception.max_retries = num_retries
+                original_exception.num_retries = current_attempt
+
            raise original_exception

    def should_retry_this_error(
@ -2333,6 +2334,8 @@ class Router:
            response = original_function(*args, **kwargs)
            return response
        except Exception as e:
+            num_retries = None
+            current_attempt = None
            original_exception = e
            ### CHECK IF RATE LIMIT / CONTEXT WINDOW ERROR
            _healthy_deployments = self._get_healthy_deployments(
@ -2383,6 +2386,11 @@ class Router:
                        healthy_deployments=_healthy_deployments,
                    )
                    time.sleep(_timeout)
+
+            if type(original_exception) in litellm.LITELLM_EXCEPTION_TYPES:
+                original_exception.max_retries = num_retries
+                original_exception.num_retries = current_attempt
+
            raise original_exception

    ### HELPER FUNCTIONS