Merge pull request #3897 from BerriAI/litellm_fix_latency_cal

ui - fix latency analytics on `completion_tokens`
2024-05-29 17:32:17 -07:00 · 2024-05-29 17:32:17 -07:00 · ea30769190
commit ea30769190
parent f9b98c57a2 02598ae988
1 changed file with 2 additions and 2 deletions
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@@ -10209,7 +10209,7 @@ async def model_metrics(
            model_group,
            model,
            DATE_TRUNC('day', "startTime")::DATE AS day,
-            AVG(EXTRACT(epoch FROM ("endTime" - "startTime"))) / SUM(total_tokens) AS avg_latency_per_token
+            AVG(EXTRACT(epoch FROM ("endTime" - "startTime")) / "completion_tokens") AS avg_latency_per_token
        FROM
            "LiteLLM_SpendLogs"
        WHERE
@@ -10221,7 +10221,7 @@ async def model_metrics(
            model,
            day
        HAVING
-            SUM(total_tokens) > 0
+            SUM(completion_tokens) > 0
        ORDER BY
            avg_latency_per_token DESC;
    """