(test) proxy - use, user provided model_list

2024-01-02 12:06:40 +05:30 · 2024-01-02 12:06:40 +05:30 · 31a896908b
commit 31a896908b
parent ddc31c4810
1 changed files with 92 additions and 0 deletions
--- a/litellm/tests/test_proxy_pass_user_config.py
+++ b/litellm/tests/test_proxy_pass_user_config.py
@ -0,0 +1,92 @@
 import sys, os
 import traceback
 from dotenv import load_dotenv
 load_dotenv()
 import os, io
 # this file is to test litellm/proxy
 sys.path.insert(
    0, os.path.abspath("../..")
 )  # Adds the parent directory to the system path
 import pytest, logging
 import litellm
 from litellm import embedding, completion, completion_cost, Timeout
 from litellm import RateLimitError
 # Configure logging
 logging.basicConfig(
    level=logging.DEBUG,  # Set the desired logging level
    format="%(asctime)s - %(levelname)s - %(message)s",
 )
 # test /chat/completion request to the proxy
 from fastapi.testclient import TestClient
 from fastapi import FastAPI
 from litellm.proxy.proxy_server import (
    router,
    save_worker_config,
    initialize,
 )  # Replace with the actual module where your FastAPI router is defined
 # Your bearer token
 token = ""
 headers = {"Authorization": f"Bearer {token}"}
@pytest.fixture(scope="function")
 def client_no_auth():
    # Assuming litellm.proxy.proxy_server is an object
    from litellm.proxy.proxy_server import cleanup_router_config_variables
    cleanup_router_config_variables()
    filepath = os.path.dirname(os.path.abspath(__file__))
    config_fp = f"{filepath}/test_configs/test_config_no_auth.yaml"
    # initialize can get run in parallel, it sets specific variables for the fast api app, sinc eit gets run in parallel different tests use the wrong variables
    initialize(config=config_fp, debug=True)
    app = FastAPI()
    app.include_router(router)  # Include your router in the test app
    return TestClient(app)
 def test_chat_completion(client_no_auth):
    global headers
    try:
        # Your test data
        test_data = {
            "model": "user-azure-instance",
            "messages": [
                {"role": "user", "content": "hi"},
            ],
            "max_tokens": 10,
            "user_config": {
                "model_list": [
                    {
                        "model_name": "user-azure-instance",  # openai model name
                        "litellm_params": {  # params for litellm completion/embedding call
                            "model": "azure/chatgpt-v-2",
                            "api_key": os.getenv("AZURE_API_KEY"),
                            "api_version": os.getenv("AZURE_API_VERSION"),
                            "api_base": os.getenv("AZURE_API_BASE"),
                        },
                        "tpm": 240000,
                        "rpm": 1800,
                    }
                ]
            },
        }
        print("testing proxy server with chat completions")
        response = client_no_auth.post("/v1/chat/completions", json=test_data)
        print(f"response - {response.text}")
        assert response.status_code == 200
        result = response.json()
        print(f"Received response: {result}")
    except Exception as e:
        pytest.fail(f"LiteLLM Proxy test failed. Exception - {str(e)}")
 # Run the test