(ci/cd) move to old version of test_proxy_server_keys.py

ishaan-jaff 2024-01-06 13:03:12 +05:30
parent 41bfd43a48
commit 4a076350cc
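Note on the change: this revert swaps httpx's AsyncClient and the anyio-marked async tests back to Starlette's synchronous TestClient. The restored version leans on one TestClient detail: entering it as a context manager fires the app's startup handlers, which is what lets wrapper_startup_event() initialize the proxy before the first request. A minimal standalone sketch of that behavior (not LiteLLM code; the /health route and ready flag are made up for illustration):

from fastapi import FastAPI
from fastapi.testclient import TestClient

app = FastAPI()
ready = False

@app.on_event("startup")
async def init():
    # Stands in for awaiting litellm's startup_event()
    global ready
    ready = True

@app.get("/health")
def health():
    return {"ready": ready}

# Entering the context manager runs the startup handlers;
# calling TestClient(app).get(...) without `with` would skip them.
with TestClient(app) as client:
    assert client.get("/health").json() == {"ready": True}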


@@ -14,7 +14,6 @@ import pytest, logging
 import litellm
 from litellm import embedding, completion, completion_cost, Timeout
 from litellm import RateLimitError
-from httpx import AsyncClient
 
 # Configure logging
 logging.basicConfig(
@@ -30,7 +29,6 @@ from litellm.proxy.proxy_server import (
     router,
     save_worker_config,
     startup_event,
-    asyncio,
 )  # Replace with the actual module where your FastAPI router is defined
 
 filepath = os.path.dirname(os.path.abspath(__file__))
@@ -53,50 +51,27 @@ save_worker_config(
     save=False,
     use_queue=False,
 )
-
-import asyncio
+app = FastAPI()
+app.include_router(router)  # Include your router in the test app
 
-# @pytest.fixture
-# def event_loop():
-#     """Create an instance of the default event loop for each test case."""
-#     policy = asyncio.WindowsSelectorEventLoopPolicy()
-#     res = policy.new_event_loop()
-#     asyncio.set_event_loop(res)
-#     res._close = res.close
-#     res.close = lambda: None
-#     yield res
-#     res._close()
+
+@app.on_event("startup")
+async def wrapper_startup_event():
+    await startup_event()
 
 # Here you create a fixture that will be used by your tests
 # Make sure the fixture returns TestClient(app)
-@pytest.fixture(scope="function")
-async def client():
-    from litellm.proxy.proxy_server import (
-        cleanup_router_config_variables,
-        initialize,
-        ProxyLogging,
-        proxy_logging_obj,
-    )
-
-    cleanup_router_config_variables()  # rest proxy before test
-    proxy_logging_obj = ProxyLogging(user_api_key_cache={})
-    proxy_logging_obj._init_litellm_callbacks()  # INITIALIZE LITELLM CALLBACKS ON SERVER STARTUP <- do this to catch any logging errors on startup, not when calls are being made
-    await initialize(config=config_fp, debug=True)
-    app = FastAPI()
-    app.include_router(router)  # Include your router in the test app
-    async with AsyncClient(app=app, base_url="http://testserver") as client:
+@pytest.fixture(autouse=True)
+def client():
+    from litellm.proxy.proxy_server import cleanup_router_config_variables
+
+    cleanup_router_config_variables()
+    with TestClient(app) as client:
         yield client
 
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key(client):
+def test_add_new_key(client):
     try:
         # Your test data
         test_data = {
@@ -104,18 +79,18 @@ async def test_add_new_key(client):
             "aliases": {"mistral-7b": "gpt-3.5-turbo"},
             "duration": "20m",
         }
-        print("testing proxy server - test_add_new_key")
+        print("testing proxy server")
         # Your bearer token
         token = os.getenv("PROXY_MASTER_KEY")
 
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
 
         result = response.json()
         assert result["key"].startswith("sk-")
 
-        async def _post_data():
+        def _post_data():
             json_data = {
                 "model": "azure-model",
                 "messages": [
@@ -125,22 +100,20 @@ async def test_add_new_key(client):
                     }
                 ],
             }
-            response = await client.post(
+            response = client.post(
                 "/chat/completions",
                 json=json_data,
                 headers={"Authorization": f"Bearer {result['key']}"},
             )
             return response
 
-        await _post_data()
+        _post_data()
         print(f"Received response: {result}")
     except Exception as e:
         pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
 
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_update_new_key(client):
+def test_update_new_key(client):
     try:
         # Your test data
         test_data = {
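The hunks above cover test_add_new_key, which drives the full happy path: mint a key via /key/generate using the master key, then spend the new key on /chat/completions. Reduced to its essentials (a sketch using only fields that appear in the test; client is the fixture above):

headers = {"Authorization": f"Bearer {os.getenv('PROXY_MASTER_KEY')}"}

# Mint a short-lived key with a model alias
resp = client.post(
    "/key/generate",
    json={"aliases": {"mistral-7b": "gpt-3.5-turbo"}, "duration": "20m"},
    headers=headers,
)
new_key = resp.json()["key"]  # generated keys are prefixed "sk-"

# The generated key, not the master key, authenticates completion calls
client.post(
    "/chat/completions",
    json={"model": "azure-model", "messages": [{"role": "user", "content": "hi"}]},
    headers={"Authorization": f"Bearer {new_key}"},
)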
@@ -148,99 +121,34 @@ async def test_update_new_key(client):
             "aliases": {"mistral-7b": "gpt-3.5-turbo"},
             "duration": "20m",
         }
-        print("testing proxy server-test_update_new_key")
+        print("testing proxy server")
         # Your bearer token
         token = os.getenv("PROXY_MASTER_KEY")
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
         result = response.json()
         assert result["key"].startswith("sk-")
 
-        async def _post_data():
+        def _post_data():
             json_data = {"models": ["bedrock-models"], "key": result["key"]}
-            response = await client.post("/key/update", json=json_data, headers=headers)
+            response = client.post("/key/update", json=json_data, headers=headers)
             print(f"response text: {response.text}")
             assert response.status_code == 200
             return response
 
-        await _post_data()
+        _post_data()
         print(f"Received response: {result}")
     except Exception as e:
         pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
 
 
-# Run the test - only runs via pytest
+# # Run the test - only runs via pytest
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key_max_parallel_limit(client):
-    try:
-        import anyio
-
-        print("ANY IO BACKENDS")
-        print(anyio.get_all_backends())
-
-        # Your test data
-        test_data = {
-            "duration": "20m",
-            "max_parallel_requests": 1,
-            "metadata": {"type": "ishaan-test"},
-        }
-        # Your bearer token
-        token = os.getenv("PROXY_MASTER_KEY")
-        headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
-        print(f"response: {response.text}")
-        assert response.status_code == 200
-        result = response.json()
-
-        async def _post_data():
-            json_data = {
-                "model": "azure-model",
-                "messages": [
-                    {
-                        "role": "user",
-                        "content": f"this is a test request, write a short poem {time.time()}",
-                    }
-                ],
-            }
-            response = await client.post(
-                "/chat/completions",
-                json=json_data,
-                headers={"Authorization": f"Bearer {result['key']}"},
-            )
-            return response
-
-        async def _run_in_parallel():
-            try:
-                futures = [_post_data() for _ in range(2)]
-                responses = await asyncio.gather(*futures)
-                print("response1 status: ", responses[0].status_code)
-                print("response2 status: ", responses[1].status_code)
-                if any(response.status_code == 429 for response in responses):
-                    pass
-                else:
-                    raise Exception()
-            except Exception as e:
-                pass
-
-        await _run_in_parallel()
-        # assert responses[0].status_code == 200 or responses[1].status_code == 200
-    except Exception as e:
-        pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
-
-
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key_max_parallel_limit_streaming(client):
+def test_add_new_key_max_parallel_limit(client):
     try:
         # Your test data
         test_data = {"duration": "20m", "max_parallel_requests": 1}
@@ -248,12 +156,60 @@ async def test_add_new_key_max_parallel_limit_streaming(client):
         token = os.getenv("PROXY_MASTER_KEY")
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
         result = response.json()
 
-        async def _post_data():
+        def _post_data():
+            json_data = {
+                "model": "azure-model",
+                "messages": [
+                    {
+                        "role": "user",
+                        "content": f"this is a test request, write a short poem {time.time()}",
+                    }
+                ],
+            }
+            response = client.post(
+                "/chat/completions",
+                json=json_data,
+                headers={"Authorization": f"Bearer {result['key']}"},
+            )
+            return response
+
+        def _run_in_parallel():
+            with ThreadPoolExecutor(max_workers=2) as executor:
+                future1 = executor.submit(_post_data)
+                future2 = executor.submit(_post_data)
+
+                # Obtain the results from the futures
+                response1 = future1.result()
+                response2 = future2.result()
+
+                if response1.status_code == 429 or response2.status_code == 429:
+                    pass
+                else:
+                    raise Exception()
+
+        _run_in_parallel()
+    except Exception as e:
+        pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
+
+
+def test_add_new_key_max_parallel_limit_streaming(client):
+    try:
+        # Your test data
+        test_data = {"duration": "20m", "max_parallel_requests": 1}
+        # Your bearer token
+        token = os.getenv("PROXY_MASTER_KEY")
+        headers = {"Authorization": f"Bearer {token}"}
+        response = client.post("/key/generate", json=test_data, headers=headers)
+        print(f"response: {response.text}")
+        assert response.status_code == 200
+        result = response.json()
+
+        def _post_data():
             json_data = {
                 "model": "azure-model",
                 "messages": [
@@ -264,26 +220,25 @@ async def test_add_new_key_max_parallel_limit_streaming(client):
                 ],
                 "stream": True,
             }
-            response = await client.post(
+            response = client.post(
                 "/chat/completions",
                 json=json_data,
                 headers={"Authorization": f"Bearer {result['key']}"},
             )
             return response
 
-        async def _run_in_parallel():
-            try:
-                futures = [_post_data() for _ in range(2)]
-                responses = await asyncio.gather(*futures)
-                print("response1 status: ", responses[0].status_code)
-                print("response2 status: ", responses[1].status_code)
-                if any(response.status_code == 429 for response in responses):
-                    pass
-                else:
-                    raise Exception()
-            except Exception as e:
-                pass
+        def _run_in_parallel():
+            with ThreadPoolExecutor(max_workers=2) as executor:
+                future1 = executor.submit(_post_data)
+                future2 = executor.submit(_post_data)
+
+                # Obtain the results from the futures
+                response1 = future1.result()
+                response2 = future2.result()
+
+                if response1.status_code == 429 or response2.status_code == 429:
+                    pass
+                else:
+                    raise Exception()
 
         _run_in_parallel()
     except Exception as e:
         pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
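The streaming variant sets "stream": True but, like the non-streaming test, only inspects status codes; the response body is never consumed. If a test did need the streamed chunks, the TestClient response can be read line by line (a sketch; the data:-prefixed SSE framing is an assumption about the proxy's wire format):

response = client.post(
    "/chat/completions",
    json=json_data,  # the same payload as above, with "stream": True
    headers={"Authorization": f"Bearer {result['key']}"},
)
for line in response.iter_lines():
    if line:
        print(line)  # e.g. a 'data: {...}' chunk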