mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-26 11:14:04 +00:00
fix(azure): return response headers for sync embedding calls
This commit is contained in:
parent
55d7bc7f32
commit
d64e971d8c
3 changed files with 30 additions and 5 deletions
|
@@ -1422,9 +1422,11 @@ def client(original_function):
|
|||
or isinstance(result, EmbeddingResponse)
|
||||
or isinstance(result, TranscriptionResponse)
|
||||
):
|
||||
result._response_ms = (
|
||||
end_time - start_time
|
||||
).total_seconds() * 1000 # return response latency in ms like openai
|
||||
setattr(
|
||||
result,
|
||||
"_response_ms",
|
||||
(end_time - start_time).total_seconds() * 1000,
|
||||
) # return response latency in ms like openai
|
||||
|
||||
### POST-CALL RULES ###
|
||||
post_call_processing(
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue