feat(proxy_server.py): team based model aliases

allow setting model aliases at a team level (e.g. route all 'gpt-3.5-turbo' requests from team-1 to model-deployment-group-2)
2025-04-25 18:54:30 +00:00 · 2024-03-06 17:42:08 -08:00 · 2024-03-06 17:42:08 -08:00 · ca97ea8acd
commit ca97ea8acd
parent cdb960eb34
5 changed files with 79 additions and 7 deletions
--- a/litellm/proxy/utils.py
+++ b/litellm/proxy/utils.py
@ -965,12 +965,21 @@ class PrismaClient:
                        )

                    sql_query = f"""
-                    SELECT *
-                    FROM "LiteLLM_VerificationTokenView"
-                    WHERE token = '{token}'
+                    SELECT 
+                    v.*,
+                    t.spend AS team_spend, 
+                    t.max_budget AS team_max_budget, 
+                    t.tpm_limit AS team_tpm_limit,
+                    t.rpm_limit AS team_rpm_limit,
+                    m.aliases as team_model_aliases
+                    FROM "LiteLLM_VerificationToken" AS v
+                    INNER JOIN "LiteLLM_TeamTable" AS t ON v.team_id = t.team_id
+                    LEFT JOIN "LiteLLM_ModelTable" m ON t.model_id = m.id
+                    WHERE v.token = '{token}'
                    """

                    response = await self.db.query_first(query=sql_query)
+
                    if response is not None:
                        response = LiteLLM_VerificationTokenView(**response)
                        # for prisma we need to cast the expires time to str