fix(router.py): cooldown deployments for 401 errors

This commit is contained in:
Krrish Dholakia 2024-04-30 17:54:00 -07:00
parent 8ee51a96f4
commit 1baad80c7d
6 changed files with 165 additions and 14 deletions

View file

@ -387,6 +387,19 @@ def mock_completion(
- If 'stream' is True, it returns a response that mimics the behavior of a streaming completion.
"""
try:
## LOGGING
logging.pre_call(
input=messages,
api_key="mock-key",
)
if isinstance(mock_response, Exception):
raise litellm.APIError(
status_code=500, # type: ignore
message=str(mock_response),
llm_provider="openai", # type: ignore
model=model, # type: ignore
request=httpx.Request(method="POST", url="https://api.openai.com/v1/"),
)
model_response = ModelResponse(stream=stream)
if stream is True:
# don't try to access stream object,