feat(proxy/utils.py): return api base for request hanging alerts

Krrish Dholakia 2024-04-06 15:58:53 -07:00
parent b49e47b634
commit 6110d32b1c
7 changed files with 180 additions and 15 deletions

@@ -3441,13 +3441,15 @@ async def chat_completion(
         )  # run the moderation check in parallel to the actual llm api call
         response = responses[1]
-        # Post Call Processing
-        data["litellm_status"] = "success"  # used for alerting
         hidden_params = getattr(response, "_hidden_params", {}) or {}
         model_id = hidden_params.get("model_id", None) or ""
         cache_key = hidden_params.get("cache_key", None) or ""
+        # Post Call Processing
+        if llm_router is not None:
+            data["deployment"] = llm_router.get_deployment(model_id=model_id)
+        data["litellm_status"] = "success"  # used for alerting
         if (
             "stream" in data and data["stream"] == True
         ):  # use generate_responses to stream responses
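
For context, here is a minimal sketch of how the deployment object attached above could be used to surface an api_base in a request-hanging alert. This is illustrative only, not the code from litellm/proxy/utils.py; the get_api_base_for_alert and format_hanging_request_alert helpers are hypothetical names, and the litellm_params/api_base lookup assumes the usual shape of a router deployment.

    from typing import Optional


    def get_api_base_for_alert(data: dict) -> Optional[str]:
        """Pull an api_base off the deployment stored in data by chat_completion."""
        deployment = data.get("deployment")
        if deployment is None:
            return None
        # Router deployments keep provider settings under litellm_params;
        # handle both dict-shaped and attribute-shaped objects defensively.
        litellm_params = getattr(deployment, "litellm_params", None) or {}
        if isinstance(litellm_params, dict):
            return litellm_params.get("api_base")
        return getattr(litellm_params, "api_base", None)


    def format_hanging_request_alert(data: dict, model: str, timeout_s: int) -> str:
        """Build the alert text, naming the upstream endpoint when it is known."""
        api_base = get_api_base_for_alert(data) or "<unknown>"
        return (
            f"Requests are hanging: no response for model={model} "
            f"(api_base={api_base}) after {timeout_s}s"
        )

With data["deployment"] populated by the hunk above, an alert built this way can point at the exact upstream endpoint that is hanging, rather than only the model alias.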