fix(lowest_latency.py): consistent time calc

This commit is contained in:
Krrish Dholakia 2024-02-14 15:03:35 -08:00
parent a6d5d0f714
commit fccacaf91b

View file

@@ -168,7 +168,7 @@ class LowestLatencyLoggingHandler(CustomLogger):
if isinstance(response_obj, ModelResponse): if isinstance(response_obj, ModelResponse):
completion_tokens = response_obj.usage.completion_tokens completion_tokens = response_obj.usage.completion_tokens
total_tokens = response_obj.usage.total_tokens total_tokens = response_obj.usage.total_tokens
final_value = float(completion_tokens / response_ms.total_seconds()) final_value = float(response_ms.total_seconds() / completion_tokens)
# ------------ # ------------
# Update usage # Update usage