forked from phoenix/litellm-mirror
working token counter endpoint
This commit is contained in:
parent
e50284bc72
commit
d42e5fcbd5
2 changed files with 26 additions and 15 deletions
|
@ -1001,3 +1001,15 @@ class LiteLLM_ErrorLogs(LiteLLMBase):
|
|||
|
||||
class LiteLLM_SpendLogs_ResponseObject(LiteLLMBase):
|
||||
response: Optional[List[Union[LiteLLM_SpendLogs, Any]]] = None
|
||||
|
||||
|
||||
class TokenCountRequest(LiteLLMBase):
|
||||
model: str
|
||||
prompt: Optional[str] = None
|
||||
messages: Optional[List[dict]] = None
|
||||
|
||||
|
||||
class TokenCountResponse(LiteLLMBase):
|
||||
total_tokens: int
|
||||
model: str
|
||||
custom_llm_provider: str
|
||||
|
|
|
@ -4766,25 +4766,24 @@ async def moderations(
|
|||
|
||||
|
||||
@router.post(
|
||||
"/dev/token_counter ",
|
||||
tags=["LLM Utils"],
|
||||
dependencies=[Depends(user_api_key_auth)],
|
||||
responses={
|
||||
200: {
|
||||
"cost": {
|
||||
"description": "The calculated cost",
|
||||
"example": 0.0,
|
||||
"type": "float",
|
||||
}
|
||||
}
|
||||
},
|
||||
"/dev/token_counter", tags=["LLM Utils"], dependencies=[Depends(user_api_key_auth)]
|
||||
)
|
||||
async def token_counter(request: Request):
|
||||
async def token_counter(request: TokenCountRequest):
|
||||
""" """
|
||||
from litellm import token_counter
|
||||
|
||||
data = await request.json()
|
||||
total_tokens = token_counter(**data)
|
||||
prompt = request.prompt
|
||||
messages = request.messages
|
||||
|
||||
if prompt is None and messages is None:
|
||||
raise HTTPException(
|
||||
status_code=400, detail="prompt or messages must be provided"
|
||||
)
|
||||
total_tokens = token_counter(
|
||||
model=request.model,
|
||||
text=prompt,
|
||||
messages=messages,
|
||||
)
|
||||
return {"total_tokens": total_tokens}
|
||||
|
||||
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue