fix(lowest_latency.py): consistent time calc

This commit is contained in:
Krrish Dholakia 2024-02-14 15:03:35 -08:00
parent a6d5d0f714
commit fccacaf91b

View file

@@ -168,7 +168,7 @@ class LowestLatencyLoggingHandler(CustomLogger):
if isinstance(response_obj, ModelResponse):
completion_tokens = response_obj.usage.completion_tokens
total_tokens = response_obj.usage.total_tokens
-final_value = float(completion_tokens / response_ms.total_seconds())
+final_value = float(response_ms.total_seconds() / completion_tokens)
# ------------
# Update usage