fix(lowest_tpm_rpm_v2.py): use a combined tpm+rpm query in async get cache, to reduce redis client calls in high traffic

2025-04-25 18:54:30 +00:00 · 2024-04-20 16:13:11 -07:00 · 2024-04-20 16:13:11 -07:00 · 9379e3d047
commit 9379e3d047
parent c5d880b6fd
4 changed files with 54 additions and 28 deletions
--- a/litellm/integrations/prometheus.py
+++ b/litellm/integrations/prometheus.py
@@ -19,7 +19,7 @@ class PrometheusLogger:
        **kwargs,
    ):
        try:
-            verbose_logger.debug(f"in init prometheus metrics")
+            print(f"in init prometheus metrics")
            from prometheus_client import Counter

            self.litellm_llm_api_failed_requests_metric = Counter(