mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-26 03:04:13 +00:00
clean up model latency metrics
This commit is contained in:
parent
38cf04cc38
commit
94b98f5c4e
1 changed files with 21 additions and 10 deletions
|
@ -7540,15 +7540,24 @@ async def model_metrics(
|
||||||
endTime = endTime or datetime.now()
|
endTime = endTime or datetime.now()
|
||||||
|
|
||||||
sql_query = """
|
sql_query = """
|
||||||
SELECT api_base, model, DATE_TRUNC('day', "startTime")::DATE AS day,
|
SELECT
|
||||||
CASE
|
api_base,
|
||||||
WHEN SUM(total_tokens) = 0 THEN 0
|
model,
|
||||||
ELSE AVG(EXTRACT(epoch FROM ("endTime" - "startTime"))) / SUM(total_tokens)
|
DATE_TRUNC('day', "startTime")::DATE AS day,
|
||||||
END AS avg_latency_per_token
|
AVG(EXTRACT(epoch FROM ("endTime" - "startTime"))) / SUM(total_tokens) AS avg_latency_per_token
|
||||||
FROM "LiteLLM_SpendLogs"
|
FROM
|
||||||
WHERE "startTime" >= NOW() - INTERVAL '30 days' AND "model" = $1
|
"LiteLLM_SpendLogs"
|
||||||
GROUP BY api_base, model, day
|
WHERE
|
||||||
ORDER BY avg_latency_per_token DESC;
|
"startTime" >= NOW() - INTERVAL '30 days'
|
||||||
|
AND "model" = $1
|
||||||
|
GROUP BY
|
||||||
|
api_base,
|
||||||
|
model,
|
||||||
|
day
|
||||||
|
HAVING
|
||||||
|
SUM(total_tokens) > 0
|
||||||
|
ORDER BY
|
||||||
|
avg_latency_per_token DESC;
|
||||||
"""
|
"""
|
||||||
_all_api_bases = set()
|
_all_api_bases = set()
|
||||||
db_response = await prisma_client.db.query_raw(
|
db_response = await prisma_client.db.query_raw(
|
||||||
|
@ -7566,6 +7575,8 @@ async def model_metrics(
|
||||||
_combined_model_name = str(_model)
|
_combined_model_name = str(_model)
|
||||||
if "https://" in _api_base:
|
if "https://" in _api_base:
|
||||||
_combined_model_name = str(_api_base)
|
_combined_model_name = str(_api_base)
|
||||||
|
if "/openai/" in _combined_model_name:
|
||||||
|
_combined_model_name = _combined_model_name.split("/openai/")[0]
|
||||||
|
|
||||||
_all_api_bases.add(_combined_model_name)
|
_all_api_bases.add(_combined_model_name)
|
||||||
_daily_entries[_day][_combined_model_name] = _avg_latency_per_token
|
_daily_entries[_day][_combined_model_name] = _avg_latency_per_token
|
||||||
|
@ -7587,7 +7598,7 @@ async def model_metrics(
|
||||||
for day in _daily_entries:
|
for day in _daily_entries:
|
||||||
entry = {"date": str(day)}
|
entry = {"date": str(day)}
|
||||||
for model_key, latency in _daily_entries[day].items():
|
for model_key, latency in _daily_entries[day].items():
|
||||||
entry[model_key] = latency.__round__(5)
|
entry[model_key] = round(latency, 8)
|
||||||
response.append(entry)
|
response.append(entry)
|
||||||
|
|
||||||
return {
|
return {
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue