(v0) prometheus metric

2025-04-26 11:14:04 +00:00 · 2024-03-19 14:48:38 -07:00 · 2024-03-19 14:48:38 -07:00 · 4b7e102187
commit 4b7e102187
parent 358f94a4c3
1 changed files with 36 additions and 0 deletions
--- a/litellm/proxy/proxy_server.py
+++ b/litellm/proxy/proxy_server.py
@ -983,6 +983,42 @@ def cost_tracking():
                litellm.success_callback.append(_PROXY_track_cost_callback)  # type: ignore
 from prometheus_client import Counter, REGISTRY
 from prometheus_client import make_asgi_app
 # Add prometheus asgi middleware to route /metrics requests
 metrics_app = make_asgi_app()
 app.mount("/metrics", metrics_app)
 try:
    calls_metric = Counter("calls_metric", "Measure of calls")
    tokens_metric = Counter("tokens_metric", "Measure of tokens")
    spend_metric = Counter("spend_metric", "Measure of spend")
 except:
    pass
 # # Define Prometheus counters for metrics
 # Register metrics with the default registry
 def track_prometheus_metrics(
    kwargs,  # kwargs to completion
    completion_response,  # response from completion
    start_time,
    end_time,  # start/end time
 ):
    global calls_metric
    user: str = ("issues",)
    key: str = ("sk-02Wr4IAlN3NvPXvL5JVvDA",)
    model: str = ("gpt-3.5-turbo",)
    budgets = 1
    tokens = 20
    # print("incrementing prometheus metrics")
    calls_metric.labels(user, key, model).inc()
 litellm.callbacks.append(track_prometheus_metrics)
 async def _PROXY_track_cost_callback(
    kwargs,  # kwargs to completion
    completion_response: litellm.ModelResponse,  # response from completion