forked from phoenix/litellm-mirror
add response ms to response object
parent fc922bc300
commit 39c3f2d6ec
4 changed files with 9 additions and 3 deletions
Binary file not shown.
@@ -791,7 +791,8 @@ def test_completion_ai21():
     try:
         response = completion(model=model_name, messages=messages)
         # Add any assertions here to check the response
-        print(response)
+        print(response["response_ms"])
+        print(response.response_ms)
     except Exception as e:
         pytest.fail(f"Error occurred: {e}")
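The updated test reads the latency both dict-style and attribute-style; OpenAIObject-based responses support both. A minimal usage sketch of what this exercises, assuming an AI21 setup like the surrounding test (the model name here is illustrative, not taken from the diff):

    from litellm import completion

    messages = [{"role": "user", "content": "Hey, how's it going?"}]
    # "j2-light" is an assumed AI21 model name for illustration
    response = completion(model="j2-light", messages=messages)
    # both access styles should yield the same latency, in milliseconds
    print(response["response_ms"])
    print(response.response_ms)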
@@ -123,7 +123,7 @@ class StreamingChoices(OpenAIObject):
         self.delta = Delta()

 class ModelResponse(OpenAIObject):
-    def __init__(self, id=None, choices=None, created=None, model=None, usage=None, stream=False, **params):
+    def __init__(self, id=None, choices=None, created=None, model=None, usage=None, stream=False, response_ms=None, **params):
         if stream:
             self.object = "chat.completion.chunk"
             self.choices = [StreamingChoices()]
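With the new keyword, a caller can pass a pre-measured latency at construction time. A one-line sketch (the field values are illustrative):

    # illustrative only: constructing a ModelResponse with a pre-measured latency
    resp = ModelResponse(model="gpt-3.5-turbo", response_ms=412.7)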
@@ -141,6 +141,10 @@ class ModelResponse(OpenAIObject):
             self.created = int(time.time())
         else:
             self.created = created
+        if response_ms:
+            response_ms = response_ms
+        else:
+            response_ms = None
         self.model = model
         self.usage = (
             usage
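Note that the added branch only rebinds the local response_ms parameter, so the constructor does not actually persist the value; in this commit the attribute is attached after the fact by the client wrapper in the next hunk. A hedged sketch of how the constructor could store it on the instance instead (an assumption, not what this commit does):

    # hypothetical alternative, not in this commit: persist the value on the instance
    if response_ms:
        self._response_ms = response_ms
    else:
        self._response_ms = None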
@@ -624,6 +628,7 @@ def client(original_function):
             ) # don't interrupt execution of main thread
             my_thread.start()
             # RETURN RESULT
+            result.response_ms = (end_time - start_time).total_seconds() * 1000 # return response latency in ms like openai
             return result
         except Exception as e:
             traceback_exception = traceback.format_exc()
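The wrapper measures wall-clock time around the underlying call and attaches it to the result, mirroring the response_ms attribute of the OpenAI client. A self-contained sketch of the pattern, simplified from the decorator above (error handling and the logging thread omitted):

    import datetime
    from functools import wraps

    def client(original_function):
        @wraps(original_function)
        def wrapper(*args, **kwargs):
            start_time = datetime.datetime.now()
            result = original_function(*args, **kwargs)
            end_time = datetime.datetime.now()
            # attach latency in milliseconds, as in the hunk above
            result.response_ms = (end_time - start_time).total_seconds() * 1000
            return result
        return wrapper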
@@ -1,6 +1,6 @@
 [tool.poetry]
 name = "litellm"
-version = "0.1.717"
+version = "0.1.718"
 description = "Library to easily interface with LLM API providers"
 authors = ["BerriAI"]
 license = "MIT License"