(feat) improve health readiness perf

2024-03-16 13:10:04 -07:00 · 2024-03-16 13:10:04 -07:00 · 61f129b9ab
commit 61f129b9ab
parent c17e721278
1 changed files with 52 additions and 31 deletions
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@ -7271,6 +7271,25 @@ async def health_endpoint(
        raise e
 # Module-level record of the last DB readiness result; "unknown" until a check has completed.
 db_health_cache = {"status": "unknown", "last_updated": datetime.now()}
 def _db_health_readiness_check():
    """
    Return the DB readiness status, reusing a cached result for up to 2 minutes.

    When the cached status is anything other than "unknown" and was recorded
    less than 2 minutes ago, the cached dict is returned as-is. Otherwise
    `prisma_client.health_check()` is called, the module-level cache is
    replaced with a fresh {"status": "connected", "last_updated": <now>} dict,
    and that dict is returned.

    Errors are deliberately not caught here: any exception raised by the
    health check propagates to the caller and the cache is left untouched.

    NOTE(review): this function is synchronous and does not await
    `prisma_client.health_check()`. If that method is a coroutine function,
    this call only creates a coroutine object and the check never actually
    runs - confirm against the prisma client implementation.
    """
    global db_health_cache, prisma_client

    # Serve from cache only when a real result exists and is still fresh.
    status_known = db_health_cache["status"] != "unknown"
    if status_known:
        fresh_until = db_health_cache["last_updated"] + timedelta(minutes=2)
        if fresh_until > datetime.now():
            return db_health_cache

    # Cache is empty or stale: hit the DB (no try/except on purpose, see docstring).
    prisma_client.health_check()
    refreshed = {"status": "connected", "last_updated": datetime.now()}
    db_health_cache = refreshed
    return refreshed
@router.get(
    "/health/readiness",
    tags=["health"],
@ -7280,41 +7299,43 @@ async def health_readiness():
    """
    Unprotected endpoint for checking if worker can receive requests
    """
-    global prisma_client
+    try:
        cache_type = None
        if litellm.cache is not None:
            from litellm.caching import RedisSemanticCache
-    cache_type = None
+            cache_type = litellm.cache.type
    if litellm.cache is not None:
        from litellm.caching import RedisSemanticCache
-        cache_type = litellm.cache.type
+            if isinstance(litellm.cache.cache, RedisSemanticCache):
                # ping the cache
                # TODO: @ishaan-jaff - we should probably not ping the cache on every /health/readiness check
                try:
                    index_info = await litellm.cache.cache._index_info()
                except Exception as e:
                    index_info = "index does not exist - error: " + str(e)
                cache_type = {"type": cache_type, "index_info": index_info}
-        if isinstance(litellm.cache.cache, RedisSemanticCache):
+        if prisma_client is not None:  # if db passed in, check if it's connected
-            # ping the cache
+            db_health_status = _db_health_readiness_check()
            try:
                index_info = await litellm.cache.cache._index_info()
            except Exception as e:
                index_info = "index does not exist - error: " + str(e)
            cache_type = {"type": cache_type, "index_info": index_info}
    if prisma_client is not None:  # if db passed in, check if it's connected
        await prisma_client.health_check()  # test the db connection
        response_object = {"db": "connected"}
-        return {
+            return {
-            "status": "healthy",
+                "status": "healthy",
-            "db": "connected",
+                "db": "connected",
-            "cache": cache_type,
+                "cache": cache_type,
-            "litellm_version": version,
+                "litellm_version": version,
-            "success_callbacks": litellm.success_callback,
+                "success_callbacks": litellm.success_callback,
-        }
+                **db_health_status,
-    else:
+            }
-        return {
+        else:
-            "status": "healthy",
+            return {
-            "db": "Not connected",
+                "status": "healthy",
-            "cache": cache_type,
+                "db": "Not connected",
-            "litellm_version": version,
+                "cache": cache_type,
-            "success_callbacks": litellm.success_callback,
+                "litellm_version": version,
-        }
+                "success_callbacks": litellm.success_callback,
-    raise HTTPException(status_code=503, detail="Service Unhealthy")
+            }
    except Exception as e:
        raise HTTPException(status_code=503, detail=f"Service Unhealthy ({str(e)})")
@router.get(