(fix) don't block proxy startup if license check fails & using prometheus (#6839)

* fix - don't block proxy startup if not a premium user * test_litellm_proxy_server_config_with_prometheus * add test for proxy startup * fix remove unused test * fix startup test * add comment on bad-license
2024-11-20 17:55:39 -08:00 · 2024-11-20 17:55:39 -08:00 · ddfe687b13
commit ddfe687b13
parent cc1f8ff0ba
4 changed files with 113 additions and 1 deletions
--- a/.circleci/config.yml
+++ b/.circleci/config.yml
@ -1039,6 +1039,48 @@ jobs:
            ls
            python -m pytest -vv tests/otel_tests -x --junitxml=test-results/junit.xml --durations=5
          no_output_timeout: 120m
           # Clean up first container
      - run:
          name: Stop and remove first container
          command: |
            docker stop my-app
            docker rm my-app
      # Second Docker Container Run with Different Config
      # NOTE: We intentionally pass a "bad" license here. We need to ensure proxy starts and serves request even with bad license
      - run:
          name: Run Second Docker container
          command: |
            docker run -d \
              -p 4000:4000 \
              -e DATABASE_URL=$PROXY_DATABASE_URL \
              -e REDIS_HOST=$REDIS_HOST \
              -e REDIS_PASSWORD=$REDIS_PASSWORD \
              -e REDIS_PORT=$REDIS_PORT \
              -e LITELLM_MASTER_KEY="sk-1234" \
              -e OPENAI_API_KEY=$OPENAI_API_KEY \
              -e LITELLM_LICENSE="bad-license" \
              --name my-app-3 \
              -v $(pwd)/litellm/proxy/example_config_yaml/enterprise_config.yaml:/app/config.yaml \
              my-app:latest \
              --config /app/config.yaml \
              --port 4000 \
              --detailed_debug
      - run:
          name: Start outputting logs for second container
          command: docker logs -f my-app-2
          background: true
      - run:
          name: Wait for second app to be ready
          command: dockerize -wait http://localhost:4000 -timeout 5m
      - run:
          name: Run second round of tests
          command: |
            python -m pytest -vv tests/basic_proxy_startup_tests -x --junitxml=test-results/junit-2.xml --durations=5
          no_output_timeout: 120m
      # Store test results
      - store_test_results:
--- a/litellm/proxy/common_utils/callback_utils.py
+++ b/litellm/proxy/common_utils/callback_utils.py
@ -242,7 +242,9 @@ def initialize_callbacks_on_proxy(  # noqa: PLR0915
        if "prometheus" in value:
            if premium_user is not True:
-                raise Exception(CommonProxyErrors.not_premium_user.value)
+                verbose_proxy_logger.warning(
                    f"Prometheus metrics are only available for premium users. {CommonProxyErrors.not_premium_user.value}"
                )
            from litellm.proxy.proxy_server import app
            verbose_proxy_logger.debug("Starting Prometheus Metrics on /metrics")
--- a/litellm/proxy/example_config_yaml/enterprise_config.yaml
+++ b/litellm/proxy/example_config_yaml/enterprise_config.yaml
@ -0,0 +1,17 @@
 model_list:
 - model_name: gpt-4
   litellm_params:
     model: openai/fake
     api_key: fake-key
     api_base: https://exampleopenaiendpoint-production.up.railway.app/
     tags: ["teamA"]
   model_info:
     id: "team-a-model"
 litellm_settings:
  cache: true
  callbacks: ["prometheus"]
 router_settings:
  enable_tag_filtering: True # 👈 Key Change
--- a/tests/basic_proxy_startup_tests/test_basic_proxy_startup.py
+++ b/tests/basic_proxy_startup_tests/test_basic_proxy_startup.py
@ -0,0 +1,51 @@
 """
 This test ensures that the proxy starts and serves requests even with a bad license.
 in ci/cd config.yml, we set the license to "bad-license"
 """
 import pytest
 import aiohttp
 from typing import Optional
@pytest.mark.asyncio
 async def test_health_and_chat_completion():
    """
    Test health endpoints and chat completion:
    1. Check /health/readiness
    2. Check /health/liveness
    3. Make a chat completion call
    """
    async with aiohttp.ClientSession() as session:
        # Test readiness endpoint
        async with session.get("http://0.0.0.0:4000/health/readiness") as response:
            assert response.status == 200
            readiness_response = await response.json()
            assert readiness_response["status"] == "connected"
        # Test liveness endpoint
        async with session.get("http://0.0.0.0:4000/health/liveness") as response:
            assert response.status == 200
            liveness_response = await response.json()
            print("liveness_response", liveness_response)
        # Make a chat completion call
        url = "http://0.0.0.0:4000/chat/completions"
        headers = {
            "Authorization": "Bearer sk-1234",
            "Content-Type": "application/json",
        }
        data = {
            "model": "gpt-4",
            "messages": [
                {"role": "system", "content": "You are a helpful assistant."},
                {"role": "user", "content": "Hello!"},
            ],
        }
        async with session.post(url, headers=headers, json=data) as response:
            assert response.status == 200
            completion_response = await response.json()
            assert "choices" in completion_response