diff --git a/litellm/router.py b/litellm/router.py index 510d179bab..4ecd41c921 100644 --- a/litellm/router.py +++ b/litellm/router.py @@ -1972,6 +1972,8 @@ class Router: response = await original_function(*args, **kwargs) return response except Exception as e: + num_retries = None + current_attempt = None original_exception = e """ Retry Logic @@ -2245,6 +2247,8 @@ class Router: response = original_function(*args, **kwargs) return response except Exception as e: + num_retries = None + current_attempt = None original_exception = e ### CHECK IF RATE LIMIT / CONTEXT WINDOW ERROR _healthy_deployments = self._get_healthy_deployments( @@ -2299,6 +2303,7 @@ class Router: if type(original_exception) in litellm.LITELLM_EXCEPTION_TYPES: original_exception.max_retries = num_retries original_exception.num_retries = current_attempt + raise original_exception ### HELPER FUNCTIONS