return llm_provider as part of the exception

2025-04-26 11:14:04 +00:00 · 2023-08-17 11:31:34 -07:00 · 2023-08-17 11:31:34 -07:00 · b91c69ffde
commit b91c69ffde
parent 2cfd4dd871
6 changed files with 75 additions and 31 deletions
--- a/litellm/utils.py
+++ b/litellm/utils.py
@ -5,13 +5,13 @@ import litellm, openai
 import random, uuid, requests
 import datetime, time
 import tiktoken
-from importlib_metadata import DistributionNotFound, VersionConflict
 encoding = tiktoken.get_encoding("cl100k_base")
 from .integrations.helicone import HeliconeLogger
 from .integrations.aispend import AISpendLogger
 from .integrations.berrispend import BerriSpendLogger
 from .integrations.supabase import Supabase
-from openai.error import AuthenticationError, InvalidRequestError, RateLimitError, ServiceUnavailableError, OpenAIError
+from openai.error import OpenAIError as OriginalError
+from .exceptions import AuthenticationError, InvalidRequestError, RateLimitError, ServiceUnavailableError, OpenAIError
 ####### ENVIRONMENT VARIABLES ###################
 dotenv.load_dotenv() # Loading env variables using dotenv
 sentry_sdk_instance = None
@ -102,18 +102,14 @@ def install_and_import(package: str):
    try:
        # Import the module 
        module = importlib.import_module(package)
-    except (ModuleNotFoundError, ImportError):
+    except ImportError:
        print_verbose(f"{package} is not installed. Installing...")
        subprocess.call([sys.executable, "-m", "pip", "install", package])
        globals()[package] = importlib.import_module(package)
-    except (DistributionNotFound, ImportError):
-        print_verbose(f"{package} is not installed. Installing...")
-        subprocess.call([sys.executable, "-m", "pip", "install", package])
-        globals()[package] = importlib.import_module(package)
-    except VersionConflict as vc:
-        print_verbose(f"Detected version conflict for {package}. Upgrading...")
-        subprocess.call([sys.executable, "-m", "pip", "install", "--upgrade", package])
-        globals()[package] = importlib.import_module(package)
+    # except VersionConflict as vc:
+    #     print_verbose(f"Detected version conflict for {package}. Upgrading...")
+    #     subprocess.call([sys.executable, "-m", "pip", "install", "--upgrade", package])
+    #     globals()[package] = importlib.import_module(package)
    finally:
        if package not in globals().keys():
            globals()[package] = importlib.import_module(package)
@ -687,8 +683,13 @@ def exception_type(model, original_exception, custom_llm_provider):
    global user_logger_fn
    exception_mapping_worked = False
    try:
-      if isinstance(original_exception, OpenAIError):
+      if isinstance(original_exception, OriginalError):
          # Handle the OpenAIError
+          exception_mapping_worked = True
+          if custom_llm_provider == "azure":
+            original_exception.llm_provider = "azure"
+          else:
+            original_exception.llm_provider = "openai"
          raise original_exception
      elif model:
        error_str = str(original_exception)
@ -702,49 +703,49 @@ def exception_type(model, original_exception, custom_llm_provider):
            print_verbose(f"status_code: {original_exception.status_code}")
            if original_exception.status_code == 401:
              exception_mapping_worked = True
-              raise AuthenticationError(f"AnthropicException - {original_exception.message}")
+              raise AuthenticationError(message=f"AnthropicException - {original_exception.message}", llm_provider="anthropic")
            elif original_exception.status_code == 400:
              exception_mapping_worked = True
-              raise InvalidRequestError(f"AnthropicException - {original_exception.message}", f"{model}")
+              raise InvalidRequestError(message=f"AnthropicException - {original_exception.message}", model=model, llm_provider="anthropic")
            elif original_exception.status_code == 429:
              exception_mapping_worked = True
-              raise RateLimitError(f"AnthropicException - {original_exception.message}")
+              raise RateLimitError(message=f"AnthropicException - {original_exception.message}", llm_provider="anthropic")
          elif "Could not resolve authentication method. Expected either api_key or auth_token to be set." in error_str:
            exception_mapping_worked = True
-            raise AuthenticationError(f"AnthropicException - {error_str}")
+            raise AuthenticationError(message=f"AnthropicException - {original_exception.message}", llm_provider="anthropic")
        elif "replicate" in model:
          if "Incorrect authentication token" in error_str:
            exception_mapping_worked = True
-            raise AuthenticationError(f"ReplicateException - {error_str}")
+            raise AuthenticationError(message=f"ReplicateException - {error_str}", llm_provider="replicate")
          elif exception_type == "ModelError":
            exception_mapping_worked = True
-            raise InvalidRequestError(f"ReplicateException - {error_str}", f"{model}")
+            raise InvalidRequestError(message=f"ReplicateException - {error_str}", model=model, llm_provider="replicate")
          elif "Request was throttled" in error_str:
            exception_mapping_worked = True
-            raise RateLimitError(f"ReplicateException - {error_str}")
+            raise RateLimitError(message=f"ReplicateException - {error_str}", llm_provider="replicate")
          elif exception_type == "ReplicateError": ## ReplicateError implies an error on Replicate server side, not user side
-            raise ServiceUnavailableError(f"ReplicateException - {error_str}")
+            raise ServiceUnavailableError(message=f"ReplicateException - {error_str}", llm_provider="replicate")
        elif model == "command-nightly": #Cohere
          if "invalid api token" in error_str or "No API key provided." in error_str:
            exception_mapping_worked = True
-            raise AuthenticationError(f"CohereException - {error_str}")
+            raise AuthenticationError(message=f"CohereException - {original_exception.message}", llm_provider="cohere")
          elif "too many tokens" in error_str:
            exception_mapping_worked = True
-            raise InvalidRequestError(f"CohereException - {error_str}", f"{model}")
+            raise InvalidRequestError(message=f"CohereException - {original_exception.message}", model=model, llm_provider="cohere")
          elif "CohereConnectionError" in exception_type: # cohere seems to fire these errors when we load test it (1k+ messages / min)
            exception_mapping_worked = True
-            raise RateLimitError(f"CohereException - {original_exception.message}")
+            raise RateLimitError(message=f"CohereException - {original_exception.message}", llm_provider="cohere")
        elif custom_llm_provider == "huggingface":
           if hasattr(original_exception, "status_code"):
              if original_exception.status_code == 401:
                exception_mapping_worked = True
-                raise AuthenticationError(f"HuggingfaceException - {original_exception.message}")
+                raise AuthenticationError(message=f"HuggingfaceException - {original_exception.message}", llm_provider="huggingface")
              elif original_exception.status_code == 400:
                exception_mapping_worked = True
-                raise InvalidRequestError(f"HuggingfaceException - {original_exception.message}", f"{model}")
+                raise InvalidRequestError(message=f"HuggingfaceException - {original_exception.message}", model=model, llm_provider="huggingface")
              elif original_exception.status_code == 429:
                exception_mapping_worked = True
-                raise RateLimitError(f"HuggingfaceException - {original_exception.message}")
+                raise RateLimitError(message=f"HuggingfaceException - {original_exception.message}", llm_provider="huggingface")
        raise original_exception # base case - return the original exception
      else:
        raise original_exception