(round 4 fixes) - Team model alias setting (#8474)

* update team info endpoint * clean up model alias * fix model alias * fix model alias card * clean up naming on docs * fix model alias card * fix _model_in_team_aliases * team alias - fix litellm.model_alias_map * fix _update_model_if_team_alias_exists * fix test_aview_spend_per_user * Test model alias functionality with teams: * complete e2e test * test_update_model_if_team_alias_exists
2025-04-26 19:24:27 +00:00 · 2025-02-11 16:40:01 -08:00 · 2025-02-11 16:40:01 -08:00 · a449eb1dc9
commit a449eb1dc9
parent 51419338df
4 changed files with 168 additions and 15 deletions
--- a/litellm/proxy/auth/user_api_key_auth.py
+++ b/litellm/proxy/auth/user_api_key_auth.py
@ -790,21 +790,6 @@ async def _user_api_key_auth_builder(  # noqa: PLR0915
                raise Exception(
                    "Key is blocked. Update via `/key/unblock` if you're admin."
                )
            # Check 1. If token can call model
            _model_alias_map = {}
            model: Optional[str] = None
            if (
                hasattr(valid_token, "team_model_aliases")
                and valid_token.team_model_aliases is not None
            ):
                _model_alias_map = {
                    **valid_token.aliases,
                    **valid_token.team_model_aliases,
                }
            else:
                _model_alias_map = {**valid_token.aliases}
            litellm.model_alias_map = _model_alias_map
            config = valid_token.config
            if config != {}:
--- a/litellm/proxy/litellm_pre_call_utils.py
+++ b/litellm/proxy/litellm_pre_call_utils.py
@ -635,6 +635,12 @@ async def add_litellm_data_to_request(  # noqa: PLR0915
        user_api_key_dict=user_api_key_dict,
    )
    # Team Model Aliases
    _update_model_if_team_alias_exists(
        data=data,
        user_api_key_dict=user_api_key_dict,
    )
    verbose_proxy_logger.debug(
        "[PROXY] returned data from litellm_pre_call_utils: %s", data
    )
@ -664,6 +670,32 @@ async def add_litellm_data_to_request(  # noqa: PLR0915
    return data
 def _update_model_if_team_alias_exists(
    data: dict,
    user_api_key_dict: UserAPIKeyAuth,
 ) -> None:
    """
    Update the model if the team alias exists
    If a alias map has been set on a team, then we want to make the request with the model the team alias is pointing to
    eg.
        - user calls `gpt-4o`
        - team.model_alias_map = {
            "gpt-4o": "gpt-4o-team-1"
        }
        - requested_model = "gpt-4o-team-1"
    """
    _model = data.get("model")
    if (
        _model
        and user_api_key_dict.team_model_aliases
        and _model in user_api_key_dict.team_model_aliases
    ):
        data["model"] = user_api_key_dict.team_model_aliases[_model]
    return
 def _get_enforced_params(
    general_settings: Optional[dict], user_api_key_dict: UserAPIKeyAuth
 ) -> Optional[list]:
--- a/tests/proxy_unit_tests/test_proxy_utils.py
+++ b/tests/proxy_unit_tests/test_proxy_utils.py
@ -1617,3 +1617,53 @@ def test_provider_specific_header():
            "anthropic-beta": "prompt-caching-2024-07-31",
        },
    }
@pytest.mark.parametrize(
    "data, user_api_key_dict, expected_model",
    [
        # Test case 1: Model exists in team aliases
        (
            {"model": "gpt-4o"},
            UserAPIKeyAuth(
                api_key="test_key", team_model_aliases={"gpt-4o": "gpt-4o-team-1"}
            ),
            "gpt-4o-team-1",
        ),
        # Test case 2: Model doesn't exist in team aliases
        (
            {"model": "gpt-4o"},
            UserAPIKeyAuth(
                api_key="test_key", team_model_aliases={"claude-3": "claude-3-team-1"}
            ),
            "gpt-4o",
        ),
        # Test case 3: No team aliases defined
        (
            {"model": "gpt-4o"},
            UserAPIKeyAuth(api_key="test_key", team_model_aliases=None),
            "gpt-4o",
        ),
        # Test case 4: No model in request data
        (
            {"messages": []},
            UserAPIKeyAuth(
                api_key="test_key", team_model_aliases={"gpt-4o": "gpt-4o-team-1"}
            ),
            None,
        ),
    ],
 )
 def test_update_model_if_team_alias_exists(data, user_api_key_dict, expected_model):
    from litellm.proxy.litellm_pre_call_utils import _update_model_if_team_alias_exists
    # Make a copy of the input data to avoid modifying the test parameters
    test_data = data.copy()
    # Call the function
    _update_model_if_team_alias_exists(
        data=test_data, user_api_key_dict=user_api_key_dict
    )
    # Check if model was updated correctly
    assert test_data.get("model") == expected_model
--- a/tests/store_model_in_db_tests/test_team_alias.py
+++ b/tests/store_model_in_db_tests/test_team_alias.py
@ -0,0 +1,86 @@
 import pytest
 import asyncio
 import aiohttp
 import json
 from openai import AsyncOpenAI
 import uuid
 from httpx import AsyncClient
 import uuid
 import os
 TEST_MASTER_KEY = "sk-1234"
 PROXY_BASE_URL = "http://0.0.0.0:4000"
@pytest.mark.asyncio
 async def test_team_model_alias():
    """
    Test model alias functionality with teams:
    1. Add a new model with model_name="gpt-4-team1" and litellm_params.model="gpt-4o"
    2. Create a new team
    3. Update team with model_alias mapping
    4. Generate key for team
    5. Make request with aliased model name
    """
    client = AsyncClient(base_url=PROXY_BASE_URL)
    headers = {"Authorization": f"Bearer {TEST_MASTER_KEY}"}
    # Add new model
    model_response = await client.post(
        "/model/new",
        json={
            "model_name": "gpt-4o-team1",
            "litellm_params": {
                "model": "gpt-4o",
                "api_key": os.getenv("OPENAI_API_KEY"),
            },
        },
        headers=headers,
    )
    assert model_response.status_code == 200
    # Create new team
    team_response = await client.post(
        "/team/new",
        json={
            "models": ["gpt-4o-team1"],
        },
        headers=headers,
    )
    assert team_response.status_code == 200
    team_data = team_response.json()
    team_id = team_data["team_id"]
    # Update team with model alias
    update_response = await client.post(
        "/team/update",
        json={"team_id": team_id, "model_aliases": {"gpt-4o": "gpt-4o-team1"}},
        headers=headers,
    )
    assert update_response.status_code == 200
    # Generate key for team
    key_response = await client.post(
        "/key/generate", json={"team_id": team_id}, headers=headers
    )
    assert key_response.status_code == 200
    key = key_response.json()["key"]
    # Make request with model alias
    openai_client = AsyncOpenAI(api_key=key, base_url=f"{PROXY_BASE_URL}/v1")
    response = await openai_client.chat.completions.create(
        model="gpt-4o",
        messages=[{"role": "user", "content": f"Test message {uuid.uuid4()}"}],
    )
    assert response is not None, "Should get valid response when using model alias"
    # Cleanup - delete the model
    model_id = model_response.json()["model_info"]["id"]
    delete_response = await client.post(
        "/model/delete",
        json={"id": model_id},
        headers={"Authorization": f"Bearer {TEST_MASTER_KEY}"},
    )
    assert delete_response.status_code == 200