mirror of https://github.com/BerriAI/litellm.git
synced 2025-04-24 18:24:20 +00:00
(ci/cd) move to old version of test_proxy_server_keys.py
This commit is contained in:
parent 41bfd43a48
commit 4a076350cc
1 changed file with 83 additions and 128 deletions
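This change reverts test_proxy_server_keys.py from the async test harness (httpx AsyncClient plus anyio markers and asyncio.gather) back to the synchronous harness built on FastAPI's TestClient and ThreadPoolExecutor. A minimal sketch of the fixture pattern the diff restores, assembled from the added lines below (the imports are assumptions, not a drop-in file):

import pytest
from fastapi import FastAPI
from fastapi.testclient import TestClient
from litellm.proxy.proxy_server import router, startup_event

app = FastAPI()
app.include_router(router)  # expose the proxy's routes on the test app


@app.on_event("startup")
async def wrapper_startup_event():
    # TestClient runs the app's startup hooks when the client context
    # below is entered, so the proxy is initialized per test here.
    await startup_event()


@pytest.fixture(autouse=True)
def client():
    # Entering TestClient as a context manager triggers the startup
    # event above; exiting it runs shutdown, isolating each test.
    with TestClient(app) as client:
        yield client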
test_proxy_server_keys.py
@@ -14,7 +14,6 @@ import pytest, logging
 import litellm
 from litellm import embedding, completion, completion_cost, Timeout
 from litellm import RateLimitError
-from httpx import AsyncClient
 
 # Configure logging
 logging.basicConfig(
@@ -30,7 +29,6 @@ from litellm.proxy.proxy_server import (
     router,
     save_worker_config,
     startup_event,
-    asyncio,
 )  # Replace with the actual module where your FastAPI router is defined
 
 filepath = os.path.dirname(os.path.abspath(__file__))
@@ -53,50 +51,27 @@ save_worker_config(
     save=False,
     use_queue=False,
 )
+app = FastAPI()
+app.include_router(router)  # Include your router in the test app
 
 
-import asyncio
-
-
-# @pytest.fixture
-# def event_loop():
-#     """Create an instance of the default event loop for each test case."""
-#     policy = asyncio.WindowsSelectorEventLoopPolicy()
-#     res = policy.new_event_loop()
-#     asyncio.set_event_loop(res)
-#     res._close = res.close
-#     res.close = lambda: None
-
-#     yield res
-
-#     res._close()
+@app.on_event("startup")
+async def wrapper_startup_event():
+    await startup_event()
 
 
 # Here you create a fixture that will be used by your tests
 # Make sure the fixture returns TestClient(app)
-@pytest.fixture(scope="function")
-async def client():
-    from litellm.proxy.proxy_server import (
-        cleanup_router_config_variables,
-        initialize,
-        ProxyLogging,
-        proxy_logging_obj,
-    )
+@pytest.fixture(autouse=True)
+def client():
+    from litellm.proxy.proxy_server import cleanup_router_config_variables
 
-    cleanup_router_config_variables()  # rest proxy before test
-    proxy_logging_obj = ProxyLogging(user_api_key_cache={})
-    proxy_logging_obj._init_litellm_callbacks()  # INITIALIZE LITELLM CALLBACKS ON SERVER STARTUP <- do this to catch any logging errors on startup, not when calls are being made
-
-    await initialize(config=config_fp, debug=True)
-    app = FastAPI()
-    app.include_router(router)  # Include your router in the test app
-    async with AsyncClient(app=app, base_url="http://testserver") as client:
+    cleanup_router_config_variables()
+    with TestClient(app) as client:
         yield client
 
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key(client):
+def test_add_new_key(client):
     try:
         # Your test data
         test_data = {
@@ -104,18 +79,18 @@ async def test_add_new_key(client):
             "aliases": {"mistral-7b": "gpt-3.5-turbo"},
             "duration": "20m",
         }
-        print("testing proxy server - test_add_new_key")
+        print("testing proxy server")
         # Your bearer token
         token = os.getenv("PROXY_MASTER_KEY")
 
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
         result = response.json()
         assert result["key"].startswith("sk-")
 
-        async def _post_data():
+        def _post_data():
             json_data = {
                 "model": "azure-model",
                 "messages": [
@@ -125,22 +100,20 @@ async def test_add_new_key(client):
                     }
                 ],
             }
-            response = await client.post(
+            response = client.post(
                 "/chat/completions",
                 json=json_data,
                 headers={"Authorization": f"Bearer {result['key']}"},
             )
             return response
 
-        await _post_data()
+        _post_data()
         print(f"Received response: {result}")
     except Exception as e:
         pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
 
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_update_new_key(client):
+def test_update_new_key(client):
     try:
         # Your test data
         test_data = {
@@ -148,99 +121,34 @@ async def test_update_new_key(client):
             "aliases": {"mistral-7b": "gpt-3.5-turbo"},
             "duration": "20m",
         }
-        print("testing proxy server-test_update_new_key")
+        print("testing proxy server")
         # Your bearer token
         token = os.getenv("PROXY_MASTER_KEY")
 
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
         result = response.json()
         assert result["key"].startswith("sk-")
 
-        async def _post_data():
+        def _post_data():
             json_data = {"models": ["bedrock-models"], "key": result["key"]}
-            response = await client.post("/key/update", json=json_data, headers=headers)
+            response = client.post("/key/update", json=json_data, headers=headers)
             print(f"response text: {response.text}")
             assert response.status_code == 200
             return response
 
-        await _post_data()
+        _post_data()
         print(f"Received response: {result}")
     except Exception as e:
         pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
 
 
-# Run the test - only runs via pytest
+# # Run the test - only runs via pytest
 
 
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key_max_parallel_limit(client):
-    try:
-        import anyio
-
-        print("ANY IO BACKENDS")
-        print(anyio.get_all_backends())
-        # Your test data
-        test_data = {
-            "duration": "20m",
-            "max_parallel_requests": 1,
-            "metadata": {"type": "ishaan-test"},
-        }
-        # Your bearer token
-        token = os.getenv("PROXY_MASTER_KEY")
-
-        headers = {"Authorization": f"Bearer {token}"}
-
-        response = await client.post("/key/generate", json=test_data, headers=headers)
-        print(f"response: {response.text}")
-        assert response.status_code == 200
-        result = response.json()
-
-        async def _post_data():
-            json_data = {
-                "model": "azure-model",
-                "messages": [
-                    {
-                        "role": "user",
-                        "content": f"this is a test request, write a short poem {time.time()}",
-                    }
-                ],
-            }
-
-            response = await client.post(
-                "/chat/completions",
-                json=json_data,
-                headers={"Authorization": f"Bearer {result['key']}"},
-            )
-            return response
-
-        async def _run_in_parallel():
-            try:
-                futures = [_post_data() for _ in range(2)]
-                responses = await asyncio.gather(*futures)
-                print("response1 status: ", responses[0].status_code)
-                print("response2 status: ", responses[1].status_code)
-
-                if any(response.status_code == 429 for response in responses):
-                    pass
-                else:
-                    raise Exception()
-            except Exception as e:
-                pass
-
-        await _run_in_parallel()
-
-        # assert responses[0].status_code == 200 or responses[1].status_code == 200
-    except Exception as e:
-        pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
-
-
-@pytest.mark.parametrize("anyio_backend", ["asyncio"])
-@pytest.mark.anyio
-async def test_add_new_key_max_parallel_limit_streaming(client):
+def test_add_new_key_max_parallel_limit(client):
     try:
         # Your test data
         test_data = {"duration": "20m", "max_parallel_requests": 1}
@@ -248,12 +156,60 @@ async def test_add_new_key_max_parallel_limit_streaming(client):
         token = os.getenv("PROXY_MASTER_KEY")
 
         headers = {"Authorization": f"Bearer {token}"}
-        response = await client.post("/key/generate", json=test_data, headers=headers)
+        response = client.post("/key/generate", json=test_data, headers=headers)
         print(f"response: {response.text}")
         assert response.status_code == 200
         result = response.json()
 
-        async def _post_data():
+        def _post_data():
             json_data = {
                 "model": "azure-model",
                 "messages": [
+                    {
+                        "role": "user",
+                        "content": f"this is a test request, write a short poem {time.time()}",
+                    }
+                ],
+            }
+            response = client.post(
+                "/chat/completions",
+                json=json_data,
+                headers={"Authorization": f"Bearer {result['key']}"},
+            )
+            return response
+
+        def _run_in_parallel():
+            with ThreadPoolExecutor(max_workers=2) as executor:
+                future1 = executor.submit(_post_data)
+                future2 = executor.submit(_post_data)
+
+                # Obtain the results from the futures
+                response1 = future1.result()
+                response2 = future2.result()
+                if response1.status_code == 429 or response2.status_code == 429:
+                    pass
+                else:
+                    raise Exception()
+
+        _run_in_parallel()
+    except Exception as e:
+        pytest.fail(f"LiteLLM Proxy test failed. Exception: {str(e)}")
+
+
+def test_add_new_key_max_parallel_limit_streaming(client):
+    try:
+        # Your test data
+        test_data = {"duration": "20m", "max_parallel_requests": 1}
+        # Your bearer token
+        token = os.getenv("PROXY_MASTER_KEY")
+
+        headers = {"Authorization": f"Bearer {token}"}
+        response = client.post("/key/generate", json=test_data, headers=headers)
+        print(f"response: {response.text}")
+        assert response.status_code == 200
+        result = response.json()
+
+        def _post_data():
+            json_data = {
+                "model": "azure-model",
+                "messages": [
@@ -264,26 +220,25 @@ async def test_add_new_key_max_parallel_limit_streaming(client):
                 ],
                 "stream": True,
             }
-            response = await client.post(
+            response = client.post(
                 "/chat/completions",
                 json=json_data,
                 headers={"Authorization": f"Bearer {result['key']}"},
             )
             return response
 
-        async def _run_in_parallel():
-            try:
-                futures = [_post_data() for _ in range(2)]
-                responses = await asyncio.gather(*futures)
-                print("response1 status: ", responses[0].status_code)
-                print("response2 status: ", responses[1].status_code)
+        def _run_in_parallel():
+            with ThreadPoolExecutor(max_workers=2) as executor:
+                future1 = executor.submit(_post_data)
+                future2 = executor.submit(_post_data)
 
-                if any(response.status_code == 429 for response in responses):
+                # Obtain the results from the futures
+                response1 = future1.result()
+                response2 = future2.result()
+                if response1.status_code == 429 or response2.status_code == 429:
                     pass
                 else:
                     raise Exception()
-            except Exception as e:
-                pass
 
         _run_in_parallel()
     except Exception as e:
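The two max-parallel tests above share the same concurrency check: fire two requests at once against a key created with max_parallel_requests set to 1, and pass only if at least one request is rejected with HTTP 429. A condensed sketch of that pattern (the helper name assert_parallel_limit_enforced is illustrative, not from the repo):

from concurrent.futures import ThreadPoolExecutor


def assert_parallel_limit_enforced(post_request):
    # post_request: any zero-argument callable that sends one
    # /chat/completions request and returns the HTTP response,
    # e.g. the _post_data helpers in the diff above.
    with ThreadPoolExecutor(max_workers=2) as executor:
        future1 = executor.submit(post_request)
        future2 = executor.submit(post_request)
        response1 = future1.result()
        response2 = future2.result()
    # With max_parallel_requests=1, the proxy's rate limiter should
    # reject at least one of the two overlapping calls with 429.
    assert 429 in (response1.status_code, response2.status_code)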