From c07eea864ee1cda3a5097ae366bc5a13e8ed61cd Mon Sep 17 00:00:00 2001 From: ChaoFu Yang Date: Wed, 16 Apr 2025 22:53:18 +0800 Subject: [PATCH] /utils/token_counter: get model_info from deployment directly (#10047) --- litellm/proxy/proxy_server.py | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/litellm/proxy/proxy_server.py b/litellm/proxy/proxy_server.py index 2062173f50..d28633ccbe 100644 --- a/litellm/proxy/proxy_server.py +++ b/litellm/proxy/proxy_server.py @@ -5290,10 +5290,7 @@ async def token_counter(request: TokenCountRequest): for _model in llm_router.model_list: if _model["model_name"] == request.model: deployment = _model - model_info = llm_router.get_router_model_info( - deployment=deployment, - received_model_name=request.model, - ) + model_info = deployment.get("model_info", {}) break if deployment is not None: litellm_model_name = deployment.get("litellm_params", {}).get("model")