fix(parallel_request_limiter.py): return remaining tpm/rpm in openai-compatible way

Fixes https://github.com/BerriAI/litellm/issues/5957
Krrish Dholakia 2024-09-28 15:56:12 -07:00
parent c0cdc6e496
commit 5222fc8e1b
4 changed files with 166 additions and 2 deletions

@@ -35,7 +35,13 @@ from typing_extensions import overload
 import litellm
 import litellm.litellm_core_utils
 import litellm.litellm_core_utils.litellm_logging
-from litellm import EmbeddingResponse, ImageResponse, ModelResponse, get_litellm_params
+from litellm import (
+    EmbeddingResponse,
+    ImageResponse,
+    ModelResponse,
+    Router,
+    get_litellm_params,
+)
 from litellm._logging import verbose_proxy_logger
 from litellm._service_logger import ServiceLogging, ServiceTypes
 from litellm.caching import DualCache, RedisCache
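
For context, "OpenAI-compatible" in the commit title refers to OpenAI's x-ratelimit-* response headers, which clients already know how to parse. Below is a minimal sketch of that idea; get_openai_ratelimit_headers and its parameters are illustrative names, not litellm's actual API, though the header names themselves are the ones OpenAI uses.

def get_openai_ratelimit_headers(
    remaining_rpm: int,
    remaining_tpm: int,
    limit_rpm: int,
    limit_tpm: int,
) -> dict[str, str]:
    """Map remaining request/token budgets onto OpenAI-style headers."""
    # OpenAI reports rate limits via x-ratelimit-* response headers, so
    # mirroring those names lets existing OpenAI client tooling read the
    # proxy's limits without modification.
    return {
        "x-ratelimit-limit-requests": str(limit_rpm),
        "x-ratelimit-remaining-requests": str(remaining_rpm),
        "x-ratelimit-limit-tokens": str(limit_tpm),
        "x-ratelimit-remaining-tokens": str(remaining_tpm),
    }

Under this scheme, a key limited to 100 requests and 10,000 tokens per minute would, after one request consuming 50 tokens, respond with x-ratelimit-remaining-requests: 99 and x-ratelimit-remaining-tokens: 9950.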