(Feat) - Allow viewing Request/Response Logs stored in GCS Bucket (#8449)

* BaseRequestResponseFetchFromCustomLogger

* get_active_base_request_response_fetch_from_custom_logger

* get_request_response_payload

* ui_view_request_response_for_request_id

* fix uiSpendLogDetailsCall

* fix get_request_response_payload

* ui fix RequestViewer

* use 1 class AdditionalLoggingUtils

* ui_view_request_response_for_request_id

* cache the prefetch logs details

* refactor prefetch

* test view request/resp logs

* fix code quality

* fix get_request_response_payload

* uninstall posthog to prevent it from being added in CI/CD

* fix posthog

* fix traceloop test

* fix linting error
Ishaan Jaff 2025-02-10 20:38:55 -08:00 committed by GitHub
parent 64a4229606
commit 00c596a852
13 changed files with 706 additions and 201 deletions

View file

@@ -0,0 +1,36 @@
"""
Base class for Additional Logging Utils for CustomLoggers
- Health Check for the logging util
- Get Request / Response Payload for the logging util
"""
from abc import ABC, abstractmethod
from datetime import datetime
from typing import Optional

from litellm.types.integrations.base_health_check import IntegrationHealthCheckStatus


class AdditionalLoggingUtils(ABC):
    def __init__(self):
        super().__init__()

    @abstractmethod
    async def async_health_check(self) -> IntegrationHealthCheckStatus:
        """
        Check if the service is healthy
        """
        pass

    @abstractmethod
    async def get_request_response_payload(
        self,
        request_id: str,
        start_time_utc: Optional[datetime],
        end_time_utc: Optional[datetime],
    ) -> Optional[dict]:
        """
        Get the request and response payload for a given `request_id`
        """
        return None
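
For orientation, a minimal sketch of a concrete subclass follows; the class name and the in-memory store are hypothetical, while the import paths are the ones introduced in this commit. Note that the proxy's callback manager (further below) only surfaces callbacks that are also CustomLogger instances.

from datetime import datetime
from typing import Dict, Optional

from litellm.integrations.additional_logging_utils import AdditionalLoggingUtils
from litellm.types.integrations.base_health_check import IntegrationHealthCheckStatus


class InMemoryPayloadLogger(AdditionalLoggingUtils):
    """Hypothetical integration that keeps request/response payloads in memory."""

    def __init__(self):
        super().__init__()
        self._payloads: Dict[str, dict] = {}

    async def async_health_check(self) -> IntegrationHealthCheckStatus:
        # Nothing external to probe for an in-memory store
        return IntegrationHealthCheckStatus(status="healthy", error_message=None)

    async def get_request_response_payload(
        self,
        request_id: str,
        start_time_utc: Optional[datetime],
        end_time_utc: Optional[datetime],
    ) -> Optional[dict]:
        # The time window is unused here; a real backend would scope its lookup with it
        return self._payloads.get(request_id)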

View file

@@ -1,19 +0,0 @@
"""
Base class for health check integrations
"""
from abc import ABC, abstractmethod

from litellm.types.integrations.base_health_check import IntegrationHealthCheckStatus


class HealthCheckIntegration(ABC):
    def __init__(self):
        super().__init__()

    @abstractmethod
    async def async_health_check(self) -> IntegrationHealthCheckStatus:
        """
        Check if the service is healthy
        """
        pass

View file

@@ -38,14 +38,14 @@ from litellm.types.integrations.datadog import *
from litellm.types.services import ServiceLoggerPayload
from litellm.types.utils import StandardLoggingPayload

-from ..base_health_check import HealthCheckIntegration
+from ..additional_logging_utils import AdditionalLoggingUtils

DD_MAX_BATCH_SIZE = 1000  # max number of logs DD API can accept


class DataDogLogger(
    CustomBatchLogger,
-    HealthCheckIntegration,
+    AdditionalLoggingUtils,
):
    # Class variables or attributes
    def __init__(
@@ -543,3 +543,13 @@ class DataDogLogger(
                status="unhealthy",
                error_message=str(e),
            )
+
+    async def get_request_response_payload(
+        self,
+        request_id: str,
+        start_time_utc: Optional[datetimeObj],
+        end_time_utc: Optional[datetimeObj],
+    ) -> Optional[dict]:
+        raise NotImplementedError(
+            "Datadog integration for getting request/response payloads is not implemented yet"
+        )

View file

@@ -1,12 +1,16 @@
import asyncio
+import json
import os
import uuid
-from datetime import datetime
+from datetime import datetime, timedelta, timezone
from typing import TYPE_CHECKING, Any, Dict, List, Optional
+from urllib.parse import quote

from litellm._logging import verbose_logger
+from litellm.integrations.additional_logging_utils import AdditionalLoggingUtils
from litellm.integrations.gcs_bucket.gcs_bucket_base import GCSBucketBase
from litellm.proxy._types import CommonProxyErrors
+from litellm.types.integrations.base_health_check import IntegrationHealthCheckStatus
from litellm.types.integrations.gcs_bucket import *
from litellm.types.utils import StandardLoggingPayload
@@ -20,7 +24,7 @@ GCS_DEFAULT_BATCH_SIZE = 2048
GCS_DEFAULT_FLUSH_INTERVAL_SECONDS = 20

-class GCSBucketLogger(GCSBucketBase):
+class GCSBucketLogger(GCSBucketBase, AdditionalLoggingUtils):
    def __init__(self, bucket_name: Optional[str] = None) -> None:
        from litellm.proxy.proxy_server import premium_user
@@ -39,6 +43,7 @@ class GCSBucketLogger(GCSBucketBase):
            batch_size=self.batch_size,
            flush_interval=self.flush_interval,
        )
+        AdditionalLoggingUtils.__init__(self)

        if premium_user is not True:
            raise ValueError(
@@ -150,11 +155,16 @@ class GCSBucketLogger(GCSBucketBase):
        """
        Get the object name to use for the current payload
        """
-        current_date = datetime.now().strftime("%Y-%m-%d")
+        current_date = self._get_object_date_from_datetime(datetime.now(timezone.utc))
        if logging_payload.get("error_str", None) is not None:
-            object_name = f"{current_date}/failure-{uuid.uuid4().hex}"
+            object_name = self._generate_failure_object_name(
+                request_date_str=current_date,
+            )
        else:
-            object_name = f"{current_date}/{response_obj.get('id', '')}"
+            object_name = self._generate_success_object_name(
+                request_date_str=current_date,
+                response_id=response_obj.get("id", ""),
+            )

        # used for testing
        _litellm_params = kwargs.get("litellm_params", None) or {}
@@ -163,3 +173,65 @@ class GCSBucketLogger(GCSBucketBase):
            object_name = _metadata["gcs_log_id"]

        return object_name
    async def get_request_response_payload(
        self,
        request_id: str,
        start_time_utc: Optional[datetime],
        end_time_utc: Optional[datetime],
    ) -> Optional[dict]:
        """
        Get the request and response payload for a given `request_id`
        Tries current day, next day, and previous day until it finds the payload
        """
        if start_time_utc is None:
            raise ValueError(
                "start_time_utc is required for getting a payload from GCS Bucket"
            )

        # Try current day, next day, and previous day
        dates_to_try = [
            start_time_utc,
            start_time_utc + timedelta(days=1),
            start_time_utc - timedelta(days=1),
        ]
        date_str = None
        for date in dates_to_try:
            try:
                date_str = self._get_object_date_from_datetime(datetime_obj=date)
                object_name = self._generate_success_object_name(
                    request_date_str=date_str,
                    response_id=request_id,
                )
                encoded_object_name = quote(object_name, safe="")
                response = await self.download_gcs_object(encoded_object_name)

                if response is not None:
                    loaded_response = json.loads(response)
                    return loaded_response
            except Exception as e:
                verbose_logger.debug(
                    f"Failed to fetch payload for date {date_str}: {str(e)}"
                )
                continue

        return None

    def _generate_success_object_name(
        self,
        request_date_str: str,
        response_id: str,
    ) -> str:
        return f"{request_date_str}/{response_id}"

    def _generate_failure_object_name(
        self,
        request_date_str: str,
    ) -> str:
        return f"{request_date_str}/failure-{uuid.uuid4().hex}"

    def _get_object_date_from_datetime(self, datetime_obj: datetime) -> str:
        return datetime_obj.strftime("%Y-%m-%d")

    async def async_health_check(self) -> IntegrationHealthCheckStatus:
        raise NotImplementedError("GCS Bucket does not support health check")
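
For reference, the lookup above reduces to probing three date-prefixed object names per request id (the start date, the next day, and the previous day, all in UTC). A standalone sketch of the naming scheme, with hypothetical values:

from datetime import datetime, timedelta, timezone

request_id = "chatcmpl-123"  # hypothetical response id
start_time_utc = datetime(2024, 1, 1, tzinfo=timezone.utc)

candidate_object_names = [
    f"{d.strftime('%Y-%m-%d')}/{request_id}"
    for d in (
        start_time_utc,
        start_time_utc + timedelta(days=1),
        start_time_utc - timedelta(days=1),
    )
]
print(candidate_object_names)
# ['2024-01-01/chatcmpl-123', '2024-01-02/chatcmpl-123', '2023-12-31/chatcmpl-123']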

View file

@@ -1,7 +1,8 @@
-from typing import Callable, List, Union
+from typing import Callable, List, Set, Union

import litellm
from litellm._logging import verbose_logger
+from litellm.integrations.additional_logging_utils import AdditionalLoggingUtils
from litellm.integrations.custom_logger import CustomLogger
@@ -220,3 +221,36 @@ class LoggingCallbackManager:
        litellm._async_success_callback = []
        litellm._async_failure_callback = []
        litellm.callbacks = []
    def _get_all_callbacks(self) -> List[Union[CustomLogger, Callable, str]]:
        """
        Get all callbacks from litellm.callbacks, litellm.success_callback,
        litellm.failure_callback, litellm._async_success_callback, and
        litellm._async_failure_callback
        """
        return (
            litellm.callbacks
            + litellm.success_callback
            + litellm.failure_callback
            + litellm._async_success_callback
            + litellm._async_failure_callback
        )

    def get_active_additional_logging_utils_from_custom_logger(
        self,
    ) -> Set[AdditionalLoggingUtils]:
        """
        Get all registered custom loggers that are instances of AdditionalLoggingUtils

        Returns:
            Set[AdditionalLoggingUtils]: the matching custom loggers
        """
        all_callbacks = self._get_all_callbacks()
        matched_callbacks: Set[AdditionalLoggingUtils] = set()
        for callback in all_callbacks:
            if isinstance(callback, CustomLogger) and isinstance(
                callback, AdditionalLoggingUtils
            ):
                matched_callbacks.add(callback)
        return matched_callbacks
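
A short usage sketch of the helper above, assuming the module-level litellm.logging_callback_manager instance that the new proxy endpoint (below) relies on:

import litellm

# Returns only the registered callbacks that implement AdditionalLoggingUtils
active_utils = (
    litellm.logging_callback_manager.get_active_additional_logging_utils_from_custom_logger()
)
for util in active_utils:
    print(type(util).__name__)  # e.g. GCSBucketLogger when callbacks: ["gcs_bucket"] is configured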

View file

@@ -5,8 +5,11 @@ model_list:
      api_key: my-fake-key
      api_base: https://exampleopenaiendpoint-production.up.railway.app/

-litellm_settings:
-  cache: True
-  cache_params:
-    type: redis
+general_settings:
+  store_model_in_db: true
+
+litellm_settings:
+  callbacks: ["gcs_bucket"]

View file

@@ -2,6 +2,7 @@
import collections
import os
from datetime import datetime, timedelta, timezone
+from functools import lru_cache
from typing import TYPE_CHECKING, Any, List, Optional

import fastapi
@@ -1759,6 +1760,56 @@ async def ui_view_spend_logs(  # noqa: PLR0915
        raise handle_exception_on_proxy(e)
@lru_cache(maxsize=128)
@router.get(
    "/spend/logs/ui/{request_id}",
    tags=["Budget & Spend Tracking"],
    dependencies=[Depends(user_api_key_auth)],
    include_in_schema=False,
)
async def ui_view_request_response_for_request_id(
    request_id: str,
    start_date: Optional[str] = fastapi.Query(
        default=None,
        description="Time from which to start viewing key spend",
    ),
    end_date: Optional[str] = fastapi.Query(
        default=None,
        description="Time till which to view key spend",
    ),
):
    """
    View request / response for a specific request_id

    - goes through all active callbacks that implement AdditionalLoggingUtils
    - returns the first request/response payload found for the request_id
    """
    custom_loggers = (
        litellm.logging_callback_manager.get_active_additional_logging_utils_from_custom_logger()
    )
    start_date_obj: Optional[datetime] = None
    end_date_obj: Optional[datetime] = None
    if start_date is not None:
        start_date_obj = datetime.strptime(start_date, "%Y-%m-%d %H:%M:%S").replace(
            tzinfo=timezone.utc
        )
    if end_date is not None:
        end_date_obj = datetime.strptime(end_date, "%Y-%m-%d %H:%M:%S").replace(
            tzinfo=timezone.utc
        )

    for custom_logger in custom_loggers:
        payload = await custom_logger.get_request_response_payload(
            request_id=request_id,
            start_time_utc=start_date_obj,
            end_time_utc=end_date_obj,
        )
        if payload is not None:
            return payload

    return None
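
An example of calling the new endpoint once the proxy is running; the base URL, virtual key, and request id below are placeholders, and start_date must be a UTC timestamp in "YYYY-MM-DD HH:MM:SS" form, matching the parsing above:

import httpx

# Hypothetical values: adjust the proxy URL, key, and request id for your deployment
PROXY_BASE_URL = "http://localhost:4000"
LITELLM_KEY = "sk-1234"
REQUEST_ID = "chatcmpl-9870a859d6df402795f75dc5fca5b2e0"

response = httpx.get(
    f"{PROXY_BASE_URL}/spend/logs/ui/{REQUEST_ID}",
    params={"start_date": "2024-01-01 00:00:00"},
    headers={"Authorization": f"Bearer {LITELLM_KEY}"},
)
response.raise_for_status()
print(response.json())  # the stored request/response payload, or null if no callback had it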
@router.get(
    "/spend/logs",
    tags=["Budget & Spend Tracking"],

View file

@@ -11,6 +11,7 @@ sys.path.insert(0, os.path.abspath("../.."))

@pytest.fixture()
+@pytest.mark.skip(reason="Traceloop use `otel` integration instead")
def exporter():
    from traceloop.sdk import Traceloop
@@ -27,6 +28,7 @@ def exporter():

@pytest.mark.parametrize("model", ["claude-3-5-haiku-20241022", "gpt-3.5-turbo"])
+@pytest.mark.skip(reason="Traceloop use `otel` integration instead")
def test_traceloop_logging(exporter, model):
    litellm.completion(
        model=model,

View file

@@ -0,0 +1,208 @@
import io
import os
import sys
sys.path.insert(0, os.path.abspath("../.."))
import asyncio
import json
import logging
import tempfile
import uuid
from datetime import datetime, timedelta, timezone
import pytest
import litellm
from litellm import completion
from litellm._logging import verbose_logger
from litellm.integrations.gcs_bucket.gcs_bucket import (
GCSBucketLogger,
StandardLoggingPayload,
)
from litellm.types.utils import StandardCallbackDynamicParams
# This is the response payload that GCS would return.
mock_response_data = {
"id": "chatcmpl-9870a859d6df402795f75dc5fca5b2e0",
"trace_id": None,
"call_type": "acompletion",
"cache_hit": None,
"stream": True,
"status": "success",
"custom_llm_provider": "openai",
"saved_cache_cost": 0.0,
"startTime": 1739235379.683053,
"endTime": 1739235379.84533,
"completionStartTime": 1739235379.84533,
"response_time": 0.1622769832611084,
"model": "my-fake-model",
"metadata": {
"user_api_key_hash": "88dc28d0f030c55ed4ab77ed8faf098196cb1c05df778539800c9f1243fe6b4b",
"user_api_key_alias": None,
"user_api_key_team_id": None,
"user_api_key_org_id": None,
"user_api_key_user_id": "default_user_id",
"user_api_key_team_alias": None,
"spend_logs_metadata": None,
"requester_ip_address": "127.0.0.1",
"requester_metadata": {},
"user_api_key_end_user_id": None,
"prompt_management_metadata": None,
},
"cache_key": None,
"response_cost": 3.7500000000000003e-05,
"total_tokens": 21,
"prompt_tokens": 9,
"completion_tokens": 12,
"request_tags": [],
"end_user": "",
"api_base": "https://exampleopenaiendpoint-production.up.railway.app",
"model_group": "fake-openai-endpoint",
"model_id": "b68d56d76b0c24ac9462ab69541e90886342508212210116e300441155f37865",
"requester_ip_address": "127.0.0.1",
"messages": [
{"role": "user", "content": [{"type": "text", "text": "very gm to u"}]}
],
"response": {
"id": "chatcmpl-9870a859d6df402795f75dc5fca5b2e0",
"created": 1677652288,
"model": "gpt-3.5-turbo-0301",
"object": "chat.completion",
"system_fingerprint": "fp_44709d6fcb",
"choices": [
{
"finish_reason": "stop",
"index": 0,
"message": {
"content": "\n\nHello there, how may I assist you today?",
"role": "assistant",
"tool_calls": None,
"function_call": None,
"refusal": None,
},
}
],
"usage": {
"completion_tokens": 12,
"prompt_tokens": 9,
"total_tokens": 21,
"completion_tokens_details": None,
"prompt_tokens_details": None,
},
"service_tier": None,
},
"model_parameters": {"stream": False, "max_retries": 0, "extra_body": {}},
"hidden_params": {
"model_id": "b68d56d76b0c24ac9462ab69541e90886342508212210116e300441155f37865",
"cache_key": None,
"api_base": "https://exampleopenaiendpoint-production.up.railway.app/",
"response_cost": 3.7500000000000003e-05,
"additional_headers": {},
"litellm_overhead_time_ms": 2.126,
},
"model_map_information": {
"model_map_key": "gpt-3.5-turbo-0301",
"model_map_value": {},
},
"error_str": None,
"error_information": {"error_code": "", "error_class": "", "llm_provider": ""},
"response_cost_failure_debug_info": None,
"guardrail_information": None,
}
@pytest.mark.asyncio
async def test_get_payload_current_day():
"""
Verify that the payload is returned when it is found on the current day.
"""
gcs_logger = GCSBucketLogger()
# Use January 1, 2024 as the current day
start_time = datetime(2024, 1, 1, tzinfo=timezone.utc)
request_id = mock_response_data["id"]
async def fake_download(object_name: str, **kwargs) -> bytes | None:
if "2024-01-01" in object_name:
return json.dumps(mock_response_data).encode("utf-8")
return None
gcs_logger.download_gcs_object = fake_download
payload = await gcs_logger.get_request_response_payload(
request_id, start_time, None
)
assert payload is not None
assert payload["id"] == request_id
@pytest.mark.asyncio
async def test_get_payload_next_day():
"""
Verify that if the payload is not found on the current day,
but is available on the next day, it is returned.
"""
gcs_logger = GCSBucketLogger()
start_time = datetime(2024, 1, 1, tzinfo=timezone.utc)
request_id = mock_response_data["id"]
async def fake_download(object_name: str, **kwargs) -> bytes | None:
if "2024-01-02" in object_name:
return json.dumps(mock_response_data).encode("utf-8")
return None
gcs_logger.download_gcs_object = fake_download
payload = await gcs_logger.get_request_response_payload(
request_id, start_time, None
)
assert payload is not None
assert payload["id"] == request_id
@pytest.mark.asyncio
async def test_get_payload_previous_day():
"""
Verify that if the payload is not found on the current or next day,
but is available on the previous day, it is returned.
"""
gcs_logger = GCSBucketLogger()
start_time = datetime(2024, 1, 1, tzinfo=timezone.utc)
request_id = mock_response_data["id"]
async def fake_download(object_name: str, **kwargs) -> bytes | None:
if "2023-12-31" in object_name:
return json.dumps(mock_response_data).encode("utf-8")
return None
gcs_logger.download_gcs_object = fake_download
payload = await gcs_logger.get_request_response_payload(
request_id, start_time, None
)
assert payload is not None
assert payload["id"] == request_id
@pytest.mark.asyncio
async def test_get_payload_not_found():
"""
Verify that if none of the three days contain the payload, None is returned.
"""
gcs_logger = GCSBucketLogger()
start_time = datetime(2024, 1, 1, tzinfo=timezone.utc)
request_id = mock_response_data["id"]
async def fake_download(object_name: str, **kwargs) -> bytes | None:
return None
gcs_logger.download_gcs_object = fake_download
payload = await gcs_logger.get_request_response_payload(
request_id, start_time, None
)
assert payload is None

View file

@@ -3221,3 +3221,41 @@ export const getGuardrailsList = async (accessToken: String) => {
    throw error;
  }
};
export const uiSpendLogDetailsCall = async (
accessToken: string,
logId: string,
start_date: string
) => {
try {
// Construct base URL
let url = proxyBaseUrl
? `${proxyBaseUrl}/spend/logs/ui/${logId}?start_date=${encodeURIComponent(start_date)}`
: `/spend/logs/ui/${logId}?start_date=${encodeURIComponent(start_date)}`;
console.log("Fetching log details from:", url);
const response = await fetch(url, {
method: "GET",
headers: {
[globalLitellmHeaderName]: `Bearer ${accessToken}`,
"Content-Type": "application/json",
},
});
if (!response.ok) {
const errorData = await response.text();
handleError(errorData);
throw new Error("Network response was not ok");
}
const data = await response.json();
console.log("Fetched log details:", data);
return data;
} catch (error) {
console.error("Failed to fetch log details:", error);
throw error;
}
};

View file

@@ -1,11 +1,12 @@
import moment from "moment";
-import { useQuery } from "@tanstack/react-query";
+import { useQuery, useQueries, useQueryClient } from "@tanstack/react-query";
import { useState, useRef, useEffect } from "react";
-import { uiSpendLogsCall } from "../networking";
+import { uiSpendLogsCall, uiSpendLogDetailsCall } from "../networking";
import { DataTable } from "./table";
import { columns, LogEntry } from "./columns";
-import { Row } from "@tanstack/react-table";
+import { RequestViewer } from "./request_viewer";
+import { prefetchLogDetails } from "./prefetch";

interface SpendLogsTableProps {
  accessToken: string | null;
@@ -54,6 +55,8 @@ export default function SpendLogsTable({
  const [selectedKeyHash, setSelectedKeyHash] = useState("");
  const [selectedFilter, setSelectedFilter] = useState("Team ID");

+  const queryClient = useQueryClient();
+
  // Close dropdown when clicking outside
  useEffect(() => {
    function handleClickOutside(event: MouseEvent) {
@@ -82,6 +85,7 @@ export default function SpendLogsTable({
      document.removeEventListener("mousedown", handleClickOutside);
  }, []);

+  // Update the logs query to use the imported prefetchLogDetails
  const logs = useQuery<PaginatedResponse>({
    queryKey: [
      "logs",
@@ -105,13 +109,21 @@ export default function SpendLogsTable({
        };
      }

-      // Convert times to UTC before formatting
+      console.log("Fetching logs with params:", {
+        startTime,
+        endTime,
+        selectedTeamId,
+        selectedKeyHash,
+        currentPage,
+        pageSize
+      });
+
      const formattedStartTime = moment(startTime).utc().format("YYYY-MM-DD HH:mm:ss");
      const formattedEndTime = isCustomDate
        ? moment(endTime).utc().format("YYYY-MM-DD HH:mm:ss")
        : moment().utc().format("YYYY-MM-DD HH:mm:ss");

-      return await uiSpendLogsCall(
+      const response = await uiSpendLogsCall(
        accessToken,
        selectedKeyHash || undefined,
        selectedTeamId || undefined,
@@ -121,30 +133,62 @@ export default function SpendLogsTable({
        currentPage,
        pageSize
      );
+
+      console.log("Received logs response:", response);
+
+      // Update prefetchLogDetails call with new parameters
+      prefetchLogDetails(response.data, formattedStartTime, accessToken, queryClient);
+
+      return response;
    },
    enabled: !!accessToken && !!token && !!userRole && !!userID,
    refetchInterval: 5000,
    refetchIntervalInBackground: true,
  });

+  // Move useQueries before the early return
+  const logDetailsQueries = useQueries({
+    queries: logs.data?.data?.map((log) => ({
+      queryKey: ["logDetails", log.request_id, moment(startTime).utc().format("YYYY-MM-DD HH:mm:ss")],
+      queryFn: () => uiSpendLogDetailsCall(accessToken!, log.request_id, moment(startTime).utc().format("YYYY-MM-DD HH:mm:ss")),
+      staleTime: 10 * 60 * 1000,
+      cacheTime: 10 * 60 * 1000,
+      enabled: !!log.request_id,
+    })) || []
+  });
+
  if (!accessToken || !token || !userRole || !userID) {
-    console.log(
-      "got None values for one of accessToken, token, userRole, userID",
-    );
+    console.log("got None values for one of accessToken, token, userRole, userID");
    return null;
  }

-  const filteredData =
-    logs.data?.data?.filter((log) => {
-      const matchesSearch =
-        !searchTerm ||
-        log.request_id.includes(searchTerm) ||
-        log.model.includes(searchTerm) ||
-        (log.user && log.user.includes(searchTerm));
-
-      // No need for additional filtering since we're now handling this in the API call
-      return matchesSearch;
-    }) || [];
+  // Consolidate log details from queries
+  const logDetails: Record<string, any> = {};
+  logDetailsQueries.forEach((q, index) => {
+    const log = logs.data?.data[index];
+    if (log && q.data) {
+      logDetails[log.request_id] = q.data;
+    }
+  });
+
+  // Modify the filtered data to include log details
+  const filteredData =
+    logs.data?.data
+      ?.filter((log) => {
+        const matchesSearch =
+          !searchTerm ||
+          log.request_id.includes(searchTerm) ||
+          log.model.includes(searchTerm) ||
+          (log.user && log.user.includes(searchTerm));
+        return matchesSearch;
+      })
+      .map(log => ({
+        ...log,
+        // Include messages/response from cached details
+        messages: logDetails[log.request_id]?.messages || [],
+        response: logDetails[log.request_id]?.response || {},
+      })) || [];

  // Add this function to handle manual refresh
  const handleRefresh = () => {
@@ -529,155 +573,3 @@ export default function SpendLogsTable({
    </div>
  );
}
function RequestViewer({ row }: { row: Row<LogEntry> }) {
const formatData = (input: any) => {
if (typeof input === "string") {
try {
return JSON.parse(input);
} catch {
return input;
}
}
return input;
};
return (
<div className="p-6 bg-gray-50 space-y-6">
{/* Combined Info Card */}
<div className="bg-white rounded-lg shadow">
<div className="p-4 border-b">
<h3 className="text-lg font-medium ">Request Details</h3>
</div>
<div className="space-y-2 p-4 ">
<div className="flex">
<span className="font-medium w-1/3">Request ID:</span>
<span>{row.original.request_id}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Api Key:</span>
<span>{row.original.api_key}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Team ID:</span>
<span>{row.original.team_id}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Model:</span>
<span>{row.original.model}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Api Base:</span>
<span>{row.original.api_base}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Call Type:</span>
<span>{row.original.call_type}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Spend:</span>
<span>{row.original.spend}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Total Tokens:</span>
<span>{row.original.total_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Prompt Tokens:</span>
<span>{row.original.prompt_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Completion Tokens:</span>
<span>{row.original.completion_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Start Time:</span>
<span>{row.original.startTime}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">End Time:</span>
<span>{row.original.endTime}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Cache Hit:</span>
<span>{row.original.cache_hit}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Cache Key:</span>
<span>{row.original.cache_key}</span>
</div>
{row?.original?.requester_ip_address && (
<div className="flex">
<span className="font-medium w-1/3">Request IP Address:</span>
<span>{row?.original?.requester_ip_address}</span>
</div>
)}
</div>
</div>
{/* Request Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Request Tags</h3>
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.request_tags), null, 2)}
</pre>
</div>
{/* Request Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Request</h3>
{/* <div>
<button className="mr-2 px-3 py-1 text-sm border rounded hover:bg-gray-50">
Expand
</button>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button>
</div> */}
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.messages), null, 2)}
</pre>
</div>
{/* Response Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Response</h3>
<div>
{/* <button className="mr-2 px-3 py-1 text-sm border rounded hover:bg-gray-50">
Expand
</button>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button> */}
</div>
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.response), null, 2)}
</pre>
</div>
{/* Metadata Card */}
{row.original.metadata &&
Object.keys(row.original.metadata).length > 0 && (
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Metadata</h3>
{/* <div>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button>
</div> */}
</div>
<pre className="p-4 text-wrap overflow-auto text-sm ">
{JSON.stringify(row.original.metadata, null, 2)}
</pre>
</div>
)}
</div>
);
}

View file

@@ -0,0 +1,23 @@
import { QueryClient } from "@tanstack/react-query";
import { uiSpendLogDetailsCall } from "../networking";
import { LogEntry } from "./columns";
export const prefetchLogDetails = (
logs: LogEntry[],
formattedStartTime: string,
accessToken: string,
queryClient: QueryClient
) => {
logs.forEach((log) => {
if (log.request_id) {
queryClient.prefetchQuery({
queryKey: ["logDetails", log.request_id, formattedStartTime],
queryFn: () => uiSpendLogDetailsCall(accessToken, log.request_id, formattedStartTime),
staleTime: 10 * 60 * 1000, // 10 minutes
gcTime: 10 * 60 * 1000, // 10 minutes
}).catch((error) => {
console.error(`Failed to prefetch details for log: ${log.request_id}`, error);
});
}
});
};

View file

@@ -0,0 +1,155 @@
import { Row } from "@tanstack/react-table";
import { LogEntry } from "./columns";
export function RequestViewer({ row }: { row: Row<LogEntry> }) {
const formatData = (input: any) => {
if (typeof input === "string") {
try {
return JSON.parse(input);
} catch {
return input;
}
}
return input;
};
return (
<div className="p-6 bg-gray-50 space-y-6">
{/* Combined Info Card */}
<div className="bg-white rounded-lg shadow">
<div className="p-4 border-b">
<h3 className="text-lg font-medium ">Request Details</h3>
</div>
<div className="space-y-2 p-4 ">
<div className="flex">
<span className="font-medium w-1/3">Request ID:</span>
<span>{row.original.request_id}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Api Key:</span>
<span>{row.original.api_key}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Team ID:</span>
<span>{row.original.team_id}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Model:</span>
<span>{row.original.model}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Api Base:</span>
<span>{row.original.api_base}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Call Type:</span>
<span>{row.original.call_type}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Spend:</span>
<span>{row.original.spend}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Total Tokens:</span>
<span>{row.original.total_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Prompt Tokens:</span>
<span>{row.original.prompt_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Completion Tokens:</span>
<span>{row.original.completion_tokens}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Start Time:</span>
<span>{row.original.startTime}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">End Time:</span>
<span>{row.original.endTime}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Cache Hit:</span>
<span>{row.original.cache_hit}</span>
</div>
<div className="flex">
<span className="font-medium w-1/3">Cache Key:</span>
<span>{row.original.cache_key}</span>
</div>
{row?.original?.requester_ip_address && (
<div className="flex">
<span className="font-medium w-1/3">Request IP Address:</span>
<span>{row?.original?.requester_ip_address}</span>
</div>
)}
</div>
</div>
{/* Request Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Request Tags</h3>
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.request_tags), null, 2)}
</pre>
</div>
{/* Request Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Request</h3>
{/* <div>
<button className="mr-2 px-3 py-1 text-sm border rounded hover:bg-gray-50">
Expand
</button>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button>
</div> */}
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.messages), null, 2)}
</pre>
</div>
{/* Response Card */}
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Response</h3>
<div>
{/* <button className="mr-2 px-3 py-1 text-sm border rounded hover:bg-gray-50">
Expand
</button>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button> */}
</div>
</div>
<pre className="p-4 text-wrap overflow-auto text-sm">
{JSON.stringify(formatData(row.original.response), null, 2)}
</pre>
</div>
{/* Metadata Card */}
{row.original.metadata &&
Object.keys(row.original.metadata).length > 0 && (
<div className="bg-white rounded-lg shadow">
<div className="flex justify-between items-center p-4 border-b">
<h3 className="text-lg font-medium">Metadata</h3>
{/* <div>
<button className="px-3 py-1 text-sm border rounded hover:bg-gray-50">
JSON
</button>
</div> */}
</div>
<pre className="p-4 text-wrap overflow-auto text-sm ">
{JSON.stringify(row.original.metadata, null, 2)}
</pre>
</div>
)}
</div>
);
}