/utils/token_counter: get model_info from deployment directly (#10047)

This commit is contained in:
ChaoFu Yang 2025-04-16 22:53:18 +08:00 committed by GitHub
parent e19d05980c
commit c07eea864e
No known key found for this signature in database
GPG key ID: B5690EEEBB952194

View file

@ -5290,10 +5290,7 @@ async def token_counter(request: TokenCountRequest):
for _model in llm_router.model_list: for _model in llm_router.model_list:
if _model["model_name"] == request.model: if _model["model_name"] == request.model:
deployment = _model deployment = _model
model_info = llm_router.get_router_model_info( model_info = deployment.get("model_info", {})
deployment=deployment,
received_model_name=request.model,
)
break break
if deployment is not None: if deployment is not None:
litellm_model_name = deployment.get("litellm_params", {}).get("model") litellm_model_name = deployment.get("litellm_params", {}).get("model")