fix(lowest_tpm_rpm_v2.py): use a combined tpm+rpm query in async get cache, to reduce redis client calls in high traffic

This commit is contained in:
Krrish Dholakia 2024-04-20 16:13:11 -07:00
parent c5d880b6fd
commit 9379e3d047
4 changed files with 54 additions and 28 deletions

View file

@@ -19,7 +19,7 @@ class PrometheusLogger:
**kwargs,
):
try:
verbose_logger.debug(f"in init prometheus metrics")
print(f"in init prometheus metrics")
from prometheus_client import Counter
self.litellm_llm_api_failed_requests_metric = Counter(