Litellm dev 12 06 2024 (#7067)

* fix(edit_budget_modal.tsx): call `/budget/update` endpoint instead of `/budget/new` allows updating existing budget on ui * fix(user_api_key_auth.py): support cost tracking for end user via jwt field * fix(presidio.py): support pii masking on sync logging callbacks enables masking before logging to langfuse * feat(utils.py): support retry policy logic inside '.completion()' Fixes https://github.com/BerriAI/litellm/issues/6623 * fix(utils.py): support retry by retry policy on async logic as well * fix(handle_jwt.py): set leeway default leeway value * test: fix test to handle jwt audience claim
2025-04-27 03:34:10 +00:00 · 2024-12-06 22:44:18 -08:00 · 2024-12-06 22:44:18 -08:00 · df3da2e5d2
commit df3da2e5d2
parent f564981556
21 changed files with 498 additions and 498 deletions
--- a/tests/local_testing/test_completion_with_retries.py
+++ b/tests/local_testing/test_completion_with_retries.py
@ -61,3 +61,68 @@ def test_completion_with_0_num_retries():
    except Exception as e:
        print("exception", e)
        pass
+
+
+@pytest.mark.asyncio
+@pytest.mark.parametrize("sync_mode", [True, False])
+async def test_completion_with_retry_policy(sync_mode):
+    from unittest.mock import patch, MagicMock, AsyncMock
+    from litellm.types.router import RetryPolicy
+
+    retry_number = 1
+    retry_policy = RetryPolicy(
+        ContentPolicyViolationErrorRetries=retry_number,  # run 3 retries for ContentPolicyViolationErrors
+        AuthenticationErrorRetries=0,  # run 0 retries for AuthenticationErrorRetries
+    )
+
+    target_function = "completion_with_retries"
+
+    with patch.object(litellm, target_function) as mock_completion_with_retries:
+        data = {
+            "model": "azure/gpt-3.5-turbo",
+            "messages": [{"gm": "vibe", "role": "user"}],
+            "retry_policy": retry_policy,
+            "mock_response": "Exception: content_filter_policy",
+        }
+        try:
+            if sync_mode:
+                completion(**data)
+            else:
+                await completion(**data)
+        except Exception as e:
+            print(e)
+
+        mock_completion_with_retries.assert_called_once()
+        assert (
+            mock_completion_with_retries.call_args.kwargs["num_retries"] == retry_number
+        )
+        assert retry_policy.ContentPolicyViolationErrorRetries == retry_number
+
+
+@pytest.mark.asyncio
+@pytest.mark.parametrize("sync_mode", [True, False])
+async def test_completion_with_retry_policy_no_error(sync_mode):
+    """
+    Test that the completion function does not throw an error when the retry policy is set
+    """
+    from unittest.mock import patch, MagicMock, AsyncMock
+    from litellm.types.router import RetryPolicy
+
+    retry_number = 1
+    retry_policy = RetryPolicy(
+        ContentPolicyViolationErrorRetries=retry_number,  # run 3 retries for ContentPolicyViolationErrors
+        AuthenticationErrorRetries=0,  # run 0 retries for AuthenticationErrorRetries
+    )
+
+    data = {
+        "model": "gpt-3.5-turbo",
+        "messages": [{"gm": "vibe", "role": "user"}],
+        "retry_policy": retry_policy,
+    }
+    try:
+        if sync_mode:
+            completion(**data)
+        else:
+            await completion(**data)
+    except Exception as e:
+        print(e)