Fix latency calculation (lower is better)

This commit is contained in:
stephenleo 2024-02-11 17:06:46 +08:00
parent 1391490d92
commit 37c83e0023

View file

@@ -86,7 +86,7 @@ class LowestLatencyLoggingHandler(CustomLogger):
if isinstance(response_obj, ModelResponse):
completion_tokens = response_obj.usage.completion_tokens
total_tokens = response_obj.usage.total_tokens
- final_value = float(completion_tokens / response_ms.total_seconds())
+ final_value = float(response_ms.total_seconds() / completion_tokens)
# ------------
# Update usage