Merge pull request #3412 from sumanth13131/usage-based-routing-ttl-on-cache

usage-based-routing-ttl-on-cache
2025-04-25 10:44:24 +00:00 · 2024-05-21 07:58:41 -07:00 · 2024-05-21 07:58:41 -07:00 · 2cda5a2bc3
commit 2cda5a2bc3
parent 07abccf96f 71e0294485
4 changed files with 98 additions and 14 deletions
--- a/litellm/router.py
+++ b/litellm/router.py
@@ -374,13 +374,17 @@ class Router:
                litellm.callbacks.append(self.leastbusy_logger)  # type: ignore
        elif routing_strategy == "usage-based-routing":
            self.lowesttpm_logger = LowestTPMLoggingHandler(
-                router_cache=self.cache, model_list=self.model_list
+                router_cache=self.cache,
+                model_list=self.model_list,
+                routing_args=routing_strategy_args
            )
            if isinstance(litellm.callbacks, list):
                litellm.callbacks.append(self.lowesttpm_logger)  # type: ignore
        elif routing_strategy == "usage-based-routing-v2":
            self.lowesttpm_logger_v2 = LowestTPMLoggingHandler_v2(
-                router_cache=self.cache, model_list=self.model_list
+                router_cache=self.cache,
+                model_list=self.model_list,
+                routing_args=routing_strategy_args
            )
            if isinstance(litellm.callbacks, list):
                litellm.callbacks.append(self.lowesttpm_logger_v2)  # type: ignore