feat(router.py): allow user to call specific deployment via id

Allows easier health checks for specific deployments by just passing in model id
This commit is contained in:
Krrish Dholakia 2024-06-19 13:02:46 -07:00
parent 9cc104eb03
commit 16889b8478
3 changed files with 42 additions and 0 deletions

View file

@ -3005,6 +3005,10 @@ async def chat_completion(
llm_router is not None and data["model"] in router_model_names
): # model in router model list
tasks.append(llm_router.acompletion(**data))
elif (
llm_router is not None and data["model"] in llm_router.get_model_ids()
): # model in router model list
tasks.append(llm_router.acompletion(**data))
elif (
llm_router is not None
and llm_router.model_group_alias is not None
@ -3256,6 +3260,10 @@ async def completion(
llm_response = asyncio.create_task(
llm_router.atext_completion(**data, specific_deployment=True)
)
elif (
llm_router is not None and data["model"] in llm_router.get_model_ids()
): # model in router model list
llm_response = asyncio.create_task(llm_router.atext_completion(**data))
elif (
llm_router is not None
and data["model"] not in router_model_names
@ -3488,6 +3496,10 @@ async def embeddings(
llm_router is not None and data["model"] in llm_router.deployment_names
): # model in router deployments, calling a specific deployment on the router
response = await llm_router.aembedding(**data, specific_deployment=True)
elif (
llm_router is not None and data["model"] in llm_router.get_model_ids()
): # model in router deployments, calling a specific deployment on the router
response = await llm_router.aembedding(**data)
elif (
llm_router is not None
and data["model"] not in router_model_names

View file

@ -4294,6 +4294,15 @@ class Router:
raise ValueError(
f"LiteLLM Router: Trying to call specific deployment, but Model:{model} does not exist in Model List: {self.model_list}"
)
elif model in self.get_model_ids():
deployment = self.get_model_info(id=model)
if deployment is not None:
deployment_model = deployment.get("litellm_params", {}).get("model")
return deployment_model, deployment
raise ValueError(
f"LiteLLM Router: Trying to call specific deployment, but Model ID :{model} does not exist in \
Model ID List: {self.get_model_ids}"
)
if model in self.model_group_alias:
verbose_router_logger.debug(

View file

@ -49,6 +49,27 @@ def test_router_multi_org_list():
assert len(router.get_model_list()) == 3
def test_router_specific_model_via_id():
"""
Call a specific deployment by it's id
"""
router = Router(
model_list=[
{
"model_name": "gpt-3.5-turbo",
"litellm_params": {
"model": "gpt-3.5-turbo",
"api_key": "my-fake-key",
"mock_response": "Hello world",
},
"model_info": {"id": "1234"},
}
]
)
router.completion(model="1234", messages=[{"role": "user", "content": "Hey!"}])
def test_router_sensitive_keys():
try:
router = Router(