Mirror of https://github.com/BerriAI/litellm.git, synced 2025-04-27 11:43:54 +00:00
test(router_code_coverage.py): check if all router functions are directly tested (#6186)

* test(router_code_coverage.py): check if all router functions are directly tested, prevent regressions
* docs(configs.md): document all environment variables (#6185)
* docs: make it easier to find anthropic/openai prompt caching doc
* added codecov yml (#6207)
* fix codecov.yaml
* run ci/cd again
* (refactor) caching: use LLMCachingHandler for async_get_cache and set_cache (#6208)
* use folder for caching
* fix importing caching
* fix clickhouse pyright
* fix linting
* fix correctly pass kwargs and args
* fix test case for embedding
* fix linting
* fix embedding caching logic
* fix refactor handle utils.py
* fix test_embedding_caching_azure_individual_items_reordered
* (feat) prometheus: have well-defined latency buckets (#6211)
* fix prometheus have well defined latency buckets
* use a well-defined latency bucket
* use types file for prometheus logging
* add test for LATENCY_BUCKETS
* fix prom testing
* fix config.yml
* (refactor caching) use LLMCachingHandler for caching streaming responses (#6210)
* use folder for caching
* fix importing caching
* fix clickhouse pyright
* fix linting
* fix correctly pass kwargs and args
* fix test case for embedding
* fix linting
* fix embedding caching logic
* fix refactor handle utils.py
* refactor async set stream cache
* fix linting
* bump (#6187)
* update code cov yaml
* fix config.yml
* add caching component to code cov
* fix config.yml ci/cd
* add coverage for proxy auth
* (refactor caching) use common `_retrieve_from_cache` helper (#6212)
* use folder for caching
* fix importing caching
* fix clickhouse pyright
* fix linting
* fix correctly pass kwargs and args
* fix test case for embedding
* fix linting
* fix embedding caching logic
* fix refactor handle utils.py
* refactor async set stream cache
* fix linting
* refactor - use _retrieve_from_cache
* refactor use _convert_cached_result_to_model_response
* fix linting errors
* bump: version 1.49.2 → 1.49.3
* fix code cov components
* test(test_router_helpers.py): add router component unit tests
* test: add additional router tests
* test: add more router testing
* test: add more router testing + more mock functions
* ci(router_code_coverage.py): fix check

---------

Co-authored-by: Ishaan Jaff <ishaanjaffer0324@gmail.com>
Co-authored-by: yujonglee <yujonglee.dev@gmail.com>
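The headline change is the new router_code_coverage.py CI check, which is meant to fail the build when a Router function has no direct test. The script itself is not part of this diff; the sketch below only illustrates that idea, and the inspect/grep approach, the test directory path, and the helper names are assumptions rather than the repository's actual implementation:

# Illustrative sketch of an "every Router function has a direct test" gate.
# Not the real router_code_coverage.py -- the repo's script may differ.
import inspect
from pathlib import Path

from litellm import Router

# Assumption: the router unit tests live here (matches the file added in this commit).
TEST_DIR = Path("tests/router_unit_tests")


def router_function_names() -> set[str]:
    """Names of functions defined directly on the Router class (inherited ones skipped)."""
    return {
        name
        for name, fn in inspect.getmembers(Router, predicate=inspect.isfunction)
        if fn.__qualname__.startswith("Router.")
    }


def combined_test_source(test_dir: Path) -> str:
    """Concatenated source of every router test module."""
    return "\n".join(path.read_text() for path in test_dir.rglob("test_*.py"))


if __name__ == "__main__":
    source = combined_test_source(TEST_DIR)
    untested = sorted(fn for fn in router_function_names() if fn not in source)
    if untested:
        raise Exception(f"Router functions without direct tests: {untested}")
    print("All router functions are referenced in the router unit tests.")

A name-in-source check like this is deliberately coarse; the real gate could just as well parse the test files' AST. The commit's stated intent is only that every router function is directly exercised by a test.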
This commit is contained in:
  parent bcd1a52834
  commit 8705f1af92

15 changed files with 768 additions and 164 deletions
tests/router_unit_tests/test_router_helper_utils.py (normal file, 252 lines added)
@@ -0,0 +1,252 @@
import sys
import os
import traceback
from dotenv import load_dotenv
from fastapi import Request
from datetime import datetime

sys.path.insert(
    0, os.path.abspath("../..")
)  # Adds the parent directory to the system path
from litellm import Router
import pytest
from unittest.mock import patch, MagicMock, AsyncMock


@pytest.fixture
def model_list():
    return [
        {
            "model_name": "gpt-3.5-turbo",
            "litellm_params": {
                "model": "gpt-3.5-turbo",
                "api_key": os.getenv("OPENAI_API_KEY"),
            },
        },
        {
            "model_name": "gpt-4o",
            "litellm_params": {
                "model": "gpt-4o",
                "api_key": os.getenv("OPENAI_API_KEY"),
            },
        },
        {
            "model_name": "dall-e-3",
            "litellm_params": {
                "model": "dall-e-3",
                "api_key": os.getenv("OPENAI_API_KEY"),
            },
        },
    ]


def test_validate_fallbacks(model_list):
    router = Router(model_list=model_list, fallbacks=[{"gpt-4o": "gpt-3.5-turbo"}])
    router.validate_fallbacks(fallback_param=[{"gpt-4o": "gpt-3.5-turbo"}])


def test_routing_strategy_init(model_list):
    """Test if all routing strategies are initialized correctly"""
    from litellm.types.router import RoutingStrategy

    router = Router(model_list=model_list)
    for strategy in RoutingStrategy._member_names_:
        router.routing_strategy_init(
            routing_strategy=strategy, routing_strategy_args={}
        )


def test_print_deployment(model_list):
    """Test if the api key is masked correctly"""
    router = Router(model_list=model_list)
    deployment = {
        "model_name": "gpt-3.5-turbo",
        "litellm_params": {
            "model": "gpt-3.5-turbo",
            "api_key": os.getenv("OPENAI_API_KEY"),
        },
    }
    printed_deployment = router.print_deployment(deployment)
    assert 10 * "*" in printed_deployment["litellm_params"]["api_key"]


def test_completion(model_list):
    """Test if the completion function is working correctly"""
    router = Router(model_list=model_list)
    response = router._completion(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": "Hello, how are you?"}],
        mock_response="I'm fine, thank you!",
    )
    assert response["choices"][0]["message"]["content"] == "I'm fine, thank you!"


@pytest.mark.parametrize("sync_mode", [True, False])
@pytest.mark.flaky(retries=6, delay=1)
@pytest.mark.asyncio
async def test_image_generation(model_list, sync_mode):
    """Test if the underlying '_image_generation' function is working correctly"""
    from litellm.types.utils import ImageResponse

    router = Router(model_list=model_list)
    if sync_mode:
        response = router._image_generation(
            model="dall-e-3",
            prompt="A cute baby sea otter",
        )
    else:
        response = await router._aimage_generation(
            model="dall-e-3",
            prompt="A cute baby sea otter",
        )

    ImageResponse.model_validate(response)


@pytest.mark.asyncio
async def test_router_acompletion_util(model_list):
    """Test if the underlying '_acompletion' function is working correctly"""
    router = Router(model_list=model_list)
    response = await router._acompletion(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": "Hello, how are you?"}],
        mock_response="I'm fine, thank you!",
    )
    assert response["choices"][0]["message"]["content"] == "I'm fine, thank you!"


@pytest.mark.asyncio
async def test_router_abatch_completion_one_model_multiple_requests_util(model_list):
    """Test if the 'abatch_completion_one_model_multiple_requests' function is working correctly"""
    router = Router(model_list=model_list)
    response = await router.abatch_completion_one_model_multiple_requests(
        model="gpt-3.5-turbo",
        messages=[
            [{"role": "user", "content": "Hello, how are you?"}],
            [{"role": "user", "content": "Hello, how are you?"}],
        ],
        mock_response="I'm fine, thank you!",
    )
    print(response)
    assert response[0]["choices"][0]["message"]["content"] == "I'm fine, thank you!"
    assert response[1]["choices"][0]["message"]["content"] == "I'm fine, thank you!"


@pytest.mark.asyncio
async def test_router_schedule_acompletion(model_list):
    """Test if the 'schedule_acompletion' function is working correctly"""
    router = Router(model_list=model_list)
    response = await router.schedule_acompletion(
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": "Hello, how are you?"}],
        mock_response="I'm fine, thank you!",
        priority=1,
    )
    assert response["choices"][0]["message"]["content"] == "I'm fine, thank you!"


@pytest.mark.asyncio
async def test_router_arealtime(model_list):
    """Test if the '_arealtime' function is working correctly"""
    import litellm

    router = Router(model_list=model_list)
    with patch.object(litellm, "_arealtime", AsyncMock()) as mock_arealtime:
        mock_arealtime.return_value = "I'm fine, thank you!"
        await router._arealtime(
            model="gpt-3.5-turbo",
            messages=[{"role": "user", "content": "Hello, how are you?"}],
        )

        mock_arealtime.assert_awaited_once()


@pytest.mark.parametrize("sync_mode", [True, False])
@pytest.mark.asyncio
async def test_router_function_with_fallbacks(model_list, sync_mode):
    """Test if the router 'async_function_with_fallbacks' + 'function_with_fallbacks' are working correctly"""
    router = Router(model_list=model_list)
    data = {
        "model": "gpt-3.5-turbo",
        "messages": [{"role": "user", "content": "Hello, how are you?"}],
        "mock_response": "I'm fine, thank you!",
        "num_retries": 0,
    }
    if sync_mode:
        response = router.function_with_fallbacks(
            original_function=router._completion,
            **data,
        )
    else:
        response = await router.async_function_with_fallbacks(
            original_function=router._acompletion,
            **data,
        )
    assert response.choices[0].message.content == "I'm fine, thank you!"


@pytest.mark.parametrize("sync_mode", [True, False])
@pytest.mark.asyncio
async def test_router_function_with_retries(model_list, sync_mode):
    """Test if the router 'async_function_with_retries' + 'function_with_retries' are working correctly"""
    router = Router(model_list=model_list)
    data = {
        "model": "gpt-3.5-turbo",
        "messages": [{"role": "user", "content": "Hello, how are you?"}],
        "mock_response": "I'm fine, thank you!",
        "num_retries": 0,
    }
    if sync_mode:
        response = router.function_with_retries(
            original_function=router._completion,
            **data,
        )
    else:
        response = await router.async_function_with_retries(
            original_function=router._acompletion,
            **data,
        )
    assert response.choices[0].message.content == "I'm fine, thank you!"


@pytest.mark.asyncio
async def test_router_make_call(model_list):
    """Test if the router 'make_call' function is working correctly"""

    ## ACOMPLETION
    router = Router(model_list=model_list)
    response = await router.make_call(
        original_function=router._acompletion,
        model="gpt-3.5-turbo",
        messages=[{"role": "user", "content": "Hello, how are you?"}],
        mock_response="I'm fine, thank you!",
    )
    assert response.choices[0].message.content == "I'm fine, thank you!"

    ## ATEXT_COMPLETION
    response = await router.make_call(
        original_function=router._atext_completion,
        model="gpt-3.5-turbo",
        prompt="Hello, how are you?",
        mock_response="I'm fine, thank you!",
    )
    assert response.choices[0].text == "I'm fine, thank you!"

    ## AEMBEDDING
    response = await router.make_call(
        original_function=router._aembedding,
        model="gpt-3.5-turbo",
        input="Hello, how are you?",
        mock_response=[0.1, 0.2, 0.3],
    )
    assert response.data[0].embedding == [0.1, 0.2, 0.3]

    ## AIMAGE_GENERATION
    response = await router.make_call(
        original_function=router._aimage_generation,
        model="dall-e-3",
        prompt="A cute baby sea otter",
        mock_response="https://example.com/image.png",
    )
    assert response.data[0].url == "https://example.com/image.png"
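For local verification, the new module can be run on its own. Most tests pass mock_response, so no real completions are issued; test_image_generation appears to call the real dall-e-3 image API (no mock_response is passed), which is presumably why it carries the flaky marker and needs a valid OPENAI_API_KEY. A minimal runner sketch, assuming it is invoked from the repository root:

# Run only the new router helper tests (equivalent to invoking pytest on the file directly).
import sys

import pytest

if __name__ == "__main__":
    sys.exit(pytest.main(["-q", "tests/router_unit_tests/test_router_helper_utils.py"]))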