(test) proxy - use, user provided model_list

2024-01-02 12:06:40 +05:30 · 2024-01-02 12:06:40 +05:30 · 31a896908b
commit 31a896908b
parent ddc31c4810
1 changed files with 92 additions and 0 deletions
--- a/litellm/tests/test_proxy_pass_user_config.py
+++ b/litellm/tests/test_proxy_pass_user_config.py
@ -0,0 +1,92 @@
+import sys, os
+import traceback
+from dotenv import load_dotenv
+
+load_dotenv()
+import os, io
+
+# Tests the litellm proxy: a chat completion request that carries its own model_list (user_config)
+
+sys.path.insert(
+    0, os.path.abspath("../..")
+)  # Puts "../.." (resolved against the current working directory) first on sys.path
+import pytest, logging
+import litellm
+from litellm import embedding, completion, completion_cost, Timeout
+from litellm import RateLimitError
+
+# Configure logging
+logging.basicConfig(
+    level=logging.DEBUG,  # DEBUG is the most verbose of the standard levels
+    format="%(asctime)s - %(levelname)s - %(message)s",
+)
+
+# Test-client setup for sending /v1/chat/completions requests to the proxy
+from fastapi.testclient import TestClient
+from fastapi import FastAPI
+from litellm.proxy.proxy_server import (
+    router,
+    save_worker_config,
+    initialize,
+)  # router is mounted on a fresh FastAPI app by the client_no_auth fixture below
+
+# Bearer token for the Authorization header (empty here; the test below does not send `headers`)
+token = ""
+
+headers = {"Authorization": f"Bearer {token}"}
+
+
+@pytest.fixture(scope="function")
+def client_no_auth():
+    # Assuming litellm.proxy.proxy_server is an object
+    from litellm.proxy.proxy_server import cleanup_router_config_variables
+
+    cleanup_router_config_variables()
+    filepath = os.path.dirname(os.path.abspath(__file__))
+    config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
+    # initialize can get run in parallel, it sets specific variables for the fast api app, sinc eit gets run in parallel different tests use the wrong variables
+    initialize(config=config_fp, debug=True)
+    app = FastAPI()
+    app.include_router(router)  # Include your router in the test app
+
+    return TestClient(app)
+
+
+def test_chat_completion(client_no_auth):
+    global headers
+    try:
+        # Your test data
+        test_data = {
+            "model": "user-azure-instance",
+            "messages": [
+                {"role": "user", "content": "hi"},
+            ],
+            "max_tokens": 10,
+            "user_config": {
+                "model_list": [
+                    {
+                        "model_name": "user-azure-instance",  # openai model name
+                        "litellm_params": {  # params for litellm completion/embedding call
+                            "model": "azure/chatgpt-v-2",
+                            "api_key": os.getenv("AZURE_API_KEY"),
+                            "api_version": os.getenv("AZURE_API_VERSION"),
+                            "api_base": os.getenv("AZURE_API_BASE"),
+                        },
+                        "tpm": 240000,
+                        "rpm": 1800,
+                    }
+                ]
+            },
+        }
+
+        print("testing proxy server with chat completions")
+        response = client_no_auth.post("/v1/chat/completions", json=test_data)
+        print(f"response - {response.text}")
+        assert response.status_code == 200
+        result = response.json()
+        print(f"Received response: {result}")
+    except Exception as e:
+        pytest.fail(f"LiteLLM Proxy test failed. Exception - {str(e)}")
+
+
+# Run the test