diff --git a/litellm/router.py b/litellm/router.py index 09b24e1d0..510d179ba 100644 --- a/litellm/router.py +++ b/litellm/router.py @@ -2295,6 +2295,10 @@ class Router: healthy_deployments=_healthy_deployments, ) time.sleep(_timeout) + + if type(original_exception) in litellm.LITELLM_EXCEPTION_TYPES: + original_exception.max_retries = num_retries + original_exception.num_retries = current_attempt raise original_exception ### HELPER FUNCTIONS