fix(slack_alerting.py): use in-memory cache for checking request status

2025-04-26 11:14:04 +00:00 · 2024-07-02 13:01:59 -07:00 · 2024-07-02 13:01:59 -07:00 · d09a78d7fd
commit d09a78d7fd
parent ffc173a94c
4 changed files with 106 additions and 36 deletions
--- a/litellm/proxy/utils.py
+++ b/litellm/proxy/utils.py
@@ -272,6 +272,16 @@ class ProxyLogging:
                callback_list=callback_list
            )

+    async def update_request_status(
+        self, litellm_call_id: str, status: Literal["success", "fail"]
+    ):
+        await self.internal_usage_cache.async_set_cache(
+            key="request_status:{}".format(litellm_call_id),
+            value=status,
+            local_only=True,
+            ttl=3600,
+        )
+
    # The actual implementation of the function
    async def pre_call_hook(
        self,
@@ -560,6 +570,9 @@ class ProxyLogging:
        """

        ### ALERTING ###
+        await self.update_request_status(
+            litellm_call_id=request_data.get("litellm_call_id", ""), status="fail"
+        )
        if "llm_exceptions" in self.alert_types and not isinstance(
            original_exception, HTTPException
        ):
@@ -611,6 +624,7 @@ class ProxyLogging:
        Covers:
        1. /chat/completions
        """
+
        for callback in litellm.callbacks:
            try:
                _callback: Optional[CustomLogger] = None