feat(utils.py): support custom cost tracking per second

https://github.com/BerriAI/litellm/issues/1374
2024-01-22 11:15:08 -08:00 · 2024-01-22 11:15:08 -08:00 · 276a685a59
commit 276a685a59
parent 44f756efb5
4 changed files with 74 additions and 31 deletions
--- a/litellm/tests/test_completion.py
+++ b/litellm/tests/test_completion.py
@@ -1372,16 +1372,21 @@ def test_customprompt_together_ai():

 def test_completion_sagemaker():
    try:
-        print("testing sagemaker")
        litellm.set_verbose = True
+        print("testing sagemaker")
        response = completion(
            model="sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4",
            messages=messages,
            temperature=0.2,
            max_tokens=80,
+            input_cost_per_second=0.000420,
        )
        # Add any assertions here to check the response
        print(response)
+        cost = completion_cost(completion_response=response)
+        assert (
+            cost > 0.0 and cost < 1.0
+        )  # should never be > $1 for a single completion call
    except Exception as e:
        pytest.fail(f"Error occurred: {e}")