forked from phoenix/litellm-mirror
router - use free paid tier routing
This commit is contained in:
parent
b0f0898f2f
commit
d42963a0ae
1 changed file with 9 additions and 4 deletions
|
@@ -17,14 +17,19 @@ class Deployment(TypedDict):
|
|||
|
||||
|
||||
async def get_deployments_for_tier(
|
||||
request_kwargs: dict,
|
||||
healthy_deployments: Optional[
|
||||
Union[List[DeploymentTypedDict], List[Dict[str, Any]]]
|
||||
] = None,
|
||||
request_kwargs: Optional[Dict[Any, Any]] = None,
|
||||
healthy_deployments: Optional[Union[List[Any], Dict[Any, Any]]] = None,
|
||||
):
|
||||
"""
|
||||
if request_kwargs contains {"metadata": {"tier": "free"}} or {"metadata": {"tier": "paid"}}, then routes the request to free/paid tier models
|
||||
"""
|
||||
if request_kwargs is None:
|
||||
verbose_logger.debug(
|
||||
"get_deployments_for_tier: request_kwargs is None returning healthy_deployments: %s",
|
||||
healthy_deployments,
|
||||
)
|
||||
return healthy_deployments
|
||||
|
||||
verbose_logger.debug("request metadata: %s", request_kwargs.get("metadata"))
|
||||
if "metadata" in request_kwargs:
|
||||
metadata = request_kwargs["metadata"]
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue