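Fix test_async_prometheus_success_logging_with_callbacks: reset success/failure callbacks and assert metric deltas against an initial REGISTRY snapshot instead of absolute values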

2024-09-09 11:54:11 -07:00 · 2024-09-09 11:54:11 -07:00 · 8a3ac60187
commit 8a3ac60187
parent e253c100f4
1 changed file with 41 additions and 10 deletions
--- a/litellm/tests/test_prometheus.py
+++ b/litellm/tests/test_prometheus.py
@@ -9,7 +9,7 @@ import logging
 import uuid

 import pytest
-from prometheus_client import REGISTRY
+from prometheus_client import REGISTRY, CollectorRegistry

 import litellm
 from litellm import completion
@@ -85,8 +85,17 @@ async def test_async_prometheus_success_logging():
 async def test_async_prometheus_success_logging_with_callbacks():
    run_id = str(uuid.uuid4())
    litellm.set_verbose = True
+
+    litellm.success_callback = []
+    litellm.failure_callback = []
    litellm.callbacks = ["prometheus"]

+    # Get initial metric values
+    initial_metrics = {}
+    for metric in REGISTRY.collect():
+        for sample in metric.samples:
+            initial_metrics[sample.name] = sample.value
+
    response = await litellm.acompletion(
        model="claude-instant-1.2",
        messages=[{"role": "user", "content": "what llm are u"}],
@@ -124,15 +133,37 @@ async def test_async_prometheus_success_logging_with_callbacks():
        vars(test_prometheus_logger.litellm_requests_metric),
    )

-    # Get the metrics
-    metrics = {}
+    # Get the updated metrics
+    updated_metrics = {}
    for metric in REGISTRY.collect():
        for sample in metric.samples:
-            metrics[sample.name] = sample.value
+            updated_metrics[sample.name] = sample.value

-    print("metrics from prometheus", metrics)
-    assert metrics["litellm_requests_metric_total"] == 1.0
-    assert metrics["litellm_total_tokens_total"] == 30.0
-    assert metrics["litellm_deployment_success_responses_total"] == 1.0
-    assert metrics["litellm_deployment_total_requests_total"] == 1.0
-    assert metrics["litellm_deployment_latency_per_output_token_bucket"] == 1.0
+    print("metrics from prometheus", updated_metrics)
+
+    # Assert the delta for each metric
+    assert (
+        updated_metrics["litellm_requests_metric_total"]
+        - initial_metrics.get("litellm_requests_metric_total", 0)
+        == 1.0
+    )
+    assert (
+        updated_metrics["litellm_total_tokens_total"]
+        - initial_metrics.get("litellm_total_tokens_total", 0)
+        == 30.0
+    )
+    assert (
+        updated_metrics["litellm_deployment_success_responses_total"]
+        - initial_metrics.get("litellm_deployment_success_responses_total", 0)
+        == 1.0
+    )
+    assert (
+        updated_metrics["litellm_deployment_total_requests_total"]
+        - initial_metrics.get("litellm_deployment_total_requests_total", 0)
+        == 1.0
+    )
+    assert (
+        updated_metrics["litellm_deployment_latency_per_output_token_bucket"]
+        - initial_metrics.get("litellm_deployment_latency_per_output_token_bucket", 0)
+        == 1.0
+    )