fix - test end user rate limits with master key

2024-05-22 16:23:15 -07:00 · 2024-05-22 16:23:15 -07:00 · 4175d00a24
commit 4175d00a24
parent a848a676af
1 changed files with 51 additions and 1 deletions
--- a/tests/test_end_users.py
+++ b/tests/test_end_users.py
@ -199,7 +199,7 @@ async def test_end_user_specific_region():


@pytest.mark.asyncio
-async def test_end_tpm_limits():
+async def test_enduser_tpm_limits_non_master_key():
    """
    1. budget_id = Create Budget with tpm_limit = 10
    2. create end_user with budget_id
@ -235,6 +235,56 @@ async def test_end_tpm_limits():

    print("\nchat completion result 1=", result)

+    # chat completion 2
+    try:
+        result = await client.chat.completions.create(
+            model="fake-openai-endpoint",
+            messages=[{"role": "user", "content": "Hey!"}],
+            user=end_user_id,
+        )
+        pytest.fail(
+            "User crossed their limit - this should have failed. instead got result = {}".format(
+                result
+            )
+        )
+    except Exception as e:
+        print("got exception 2 =", e)
+        assert "Crossed TPM, RPM Limit" in str(
+            e
+        ), f"Expected 'Crossed TPM, RPM Limit' but got {str(e)}"
+
+
+@pytest.mark.asyncio
+async def test_enduser_tpm_limits_with_master_key():
+    """
+    1. budget_id = Create Budget with tpm_limit = 10
+    2. create end_user with budget_id
+    3. Make /chat/completions calls
+    4. Sleep 1 second
+    4. Make  /chat/completions call -> expect this to fail because rate limit hit
+    """
+    async with aiohttp.ClientSession() as session:
+        # create a budget with budget_id = "free-tier"
+        budget_id = f"free-tier-{uuid.uuid4()}"
+        await new_budget(session, 0, budget_id=budget_id)
+
+        end_user_id = str(uuid.uuid4())
+
+        await new_end_user(
+            session=session, i=0, user_id=end_user_id, budget_id=budget_id
+        )
+
+    # chat completion 1
+    client = AsyncOpenAI(api_key="sk-1234", base_url="http://0.0.0.0:4000")
+
+    result = await client.chat.completions.create(
+        model="fake-openai-endpoint",
+        messages=[{"role": "user", "content": "Hey!"}],
+        user=end_user_id,
+    )
+
+    print("\nchat completion result 1=", result)
+
    await asyncio.sleep(1)

    # chat completion 2