fix exception mapping for vertex ai

2024-06-18 08:38:36 -07:00 · 2024-06-18 08:38:36 -07:00 · 8f3bd0780b
commit 8f3bd0780b
parent fdb9b24b9f
1 changed file with 17 additions and 0 deletions
--- a/litellm/utils.py
+++ b/litellm/utils.py
@@ -6297,6 +6297,7 @@ def exception_type(
                    )
                elif (
                    "429 Quota exceeded" in error_str
                    or "Quota exceeded for" in error_str
                    or "IndexError: list index out of range" in error_str
                    or "429 Unable to submit request because the service is temporarily out of capacity."
                    in error_str
@@ -6339,6 +6340,22 @@ def exception_type(
                                ),
                            ),
                        )
                    if original_exception.status_code == 429:
                        exception_mapping_worked = True
                        raise RateLimitError(
                            message=f"litellm.RateLimitError: VertexAIException - {error_str}",
                            model=model,
                            llm_provider="vertex_ai",
                            litellm_debug_info=extra_information,
                            response=httpx.Response(
                                status_code=429,
                                request=httpx.Request(
                                    method="POST",
                                    url=" https://cloud.google.com/vertex-ai/",
                                ),
                            ),
                        )
                    if original_exception.status_code == 500:
                        exception_mapping_worked = True
                        raise litellm.InternalServerError(