fix(proxy_cli.py-&&-proxy_server.py): bump reset budget intervals and fix pool limits for prisma connections

This commit is contained in:
Krrish Dholakia 2024-02-06 19:39:49 -08:00
parent b6adeec347
commit 4a0df3cb4f
5 changed files with 36 additions and 18 deletions

View file

@ -431,9 +431,9 @@ async def test_key_info_spend_values_image_generation():
@pytest.mark.asyncio
async def test_key_with_budgets():
"""
- Create key with budget and 5s duration
- Create key with budget and 5min duration
- Get 'reset_at' value
- wait 5s
- wait 10min (budget reset runs every 10mins.)
- Check if value updated
"""
from litellm.proxy.utils import hash_token
@ -449,8 +449,8 @@ async def test_key_with_budgets():
reset_at_init_value = key_info["info"]["budget_reset_at"]
reset_at_new_value = None
i = 0
await asyncio.sleep(610)
while i < 3:
await asyncio.sleep(30)
key_info = await get_key_info(session=session, get_key=key, call_key=key)
reset_at_new_value = key_info["info"]["budget_reset_at"]
try:
@ -458,6 +458,7 @@ async def test_key_with_budgets():
break
except:
i + 1
await asyncio.sleep(5)
assert reset_at_init_value != reset_at_new_value
@ -481,7 +482,7 @@ async def test_key_crossing_budget():
response = await chat_completion(session=session, key=key)
print("response 1: ", response)
await asyncio.sleep(2)
await asyncio.sleep(10)
try:
response = await chat_completion(session=session, key=key)
pytest.fail("Should have failed - Key crossed it's budget")

View file

@ -113,6 +113,7 @@ async def test_spend_logs():
await get_spend_logs(session=session, request_id=response["id"])
@pytest.mark.skip(reason="High traffic load test, meant to be run locally")
@pytest.mark.asyncio
async def test_spend_logs_high_traffic():
"""
@ -155,9 +156,12 @@ async def test_spend_logs_high_traffic():
successful_completions = [c for c in chat_completions if c is not None]
print(f"Num successful completions: {len(successful_completions)}")
await asyncio.sleep(10)
response = await get_spend_logs(session=session, api_key=key)
print(f"response: {response}")
print(f"len responses: {len(response)}")
assert len(response) == n
print(n, time.time() - start, len(response))
try:
response = await retry_request(get_spend_logs, session=session, api_key=key)
print(f"response: {response}")
print(f"len responses: {len(response)}")
assert len(response) == n
print(n, time.time() - start, len(response))
except:
print(n, time.time() - start, 0)
raise Exception("it worked!")