mirror of https://github.com/BerriAI/litellm.git (synced 2025-04-27 03:34:10 +00:00)

feat - set custom routing strategy

commit 7ce2aa83c1, parent 1a4467c1a5

3 changed files with 45 additions and 1 deletion
@@ -865,7 +865,7 @@
     },
     "deepseek-coder": {
         "max_tokens": 4096,
-        "max_input_tokens": 16000,
+        "max_input_tokens": 32000,
         "max_output_tokens": 4096,
         "input_cost_per_token": 0.00000014,
         "output_cost_per_token": 0.00000028,
@@ -1984,6 +1984,15 @@
         "litellm_provider": "replicate",
         "mode": "chat"
     },
+    "openrouter/deepseek/deepseek-coder": {
+        "max_tokens": 4096,
+        "max_input_tokens": 32000,
+        "max_output_tokens": 4096,
+        "input_cost_per_token": 0.00000014,
+        "output_cost_per_token": 0.00000028,
+        "litellm_provider": "openrouter",
+        "mode": "chat"
+    },
     "openrouter/microsoft/wizardlm-2-8x22b:nitro": {
         "max_tokens": 65536,
         "input_cost_per_token": 0.000001,
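The two `*_cost_per_token` fields are USD per token, so even a maxed-out request against this new entry costs a fraction of a cent. A back-of-the-envelope check (a standalone sketch; `request_cost` is a hypothetical helper, not part of litellm):

```python
# Per-token prices from the "openrouter/deepseek/deepseek-coder" entry above (USD).
INPUT_COST_PER_TOKEN = 0.00000014
OUTPUT_COST_PER_TOKEN = 0.00000028

def request_cost(input_tokens: int, output_tokens: int) -> float:
    """Hypothetical helper: USD cost of one request at these prices."""
    return input_tokens * INPUT_COST_PER_TOKEN + output_tokens * OUTPUT_COST_PER_TOKEN

# Worst case for this entry: max_input_tokens=32000, max_output_tokens=4096.
print(f"${request_cost(32_000, 4_096):.6f}")  # -> $0.005627
```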
@@ -69,6 +69,7 @@ from litellm.types.router import (
     AlertingConfig,
     AllowedFailsPolicy,
     AssistantsTypedDict,
+    CustomRoutingStrategy,
     Deployment,
     DeploymentTypedDict,
     LiteLLM_Params,
@@ -4814,6 +4815,18 @@ class Router:
         except Exception as e:
             pass

+    def set_custom_routing_strategy(self, CustomRoutingStrategy: CustomRoutingStrategy):
+        setattr(
+            self,
+            "get_available_deployment",
+            CustomRoutingStrategy.get_available_deployment,
+        )
+        setattr(
+            self,
+            "async_get_available_deployment",
+            CustomRoutingStrategy.async_get_available_deployment,
+        )
+
     def flush_cache(self):
         litellm.cache = None
         self.cache.flush_cache()
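The two `setattr` calls assign the strategy object's bound methods as instance attributes, which shadow `Router`'s class-level `get_available_deployment` / `async_get_available_deployment` for that instance only, so every later routing lookup dispatches to the custom strategy. A minimal standalone sketch of that mechanism (toy class names, not litellm's):

```python
class Strategy:
    def pick(self) -> str:
        return "custom choice"

class MiniRouter:
    def pick(self) -> str:
        return "default choice"

router = MiniRouter()
strategy = Strategy()

# Assigning the strategy's *bound* method as an instance attribute
# shadows the class-level MiniRouter.pick for this instance only.
setattr(router, "pick", strategy.pick)

print(router.pick())        # -> "custom choice"
print(MiniRouter().pick())  # other instances unaffected -> "default choice"
```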
@@ -451,3 +451,25 @@ class ModelGroupInfo(BaseModel):
 class AssistantsTypedDict(TypedDict):
     custom_llm_provider: Literal["azure", "openai"]
     litellm_params: LiteLLMParamsTypedDict
+
+
+class CustomRoutingStrategy:
+    async def async_get_available_deployment(
+        self,
+        model: str,
+        messages: Optional[List[Dict[str, str]]] = None,
+        input: Optional[Union[str, List]] = None,
+        specific_deployment: Optional[bool] = False,
+        request_kwargs: Optional[Dict] = None,
+    ):
+        pass
+
+    def get_available_deployment(
+        self,
+        model: str,
+        messages: Optional[List[Dict[str, str]]] = None,
+        input: Optional[Union[str, List]] = None,
+        specific_deployment: Optional[bool] = False,
+        request_kwargs: Optional[Dict] = None,
+    ):
+        pass
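Taken together with the `Router.set_custom_routing_strategy` hunk above, the intended usage is to subclass `CustomRoutingStrategy`, override one or both hooks to return a deployment, and register an instance on the router. A sketch assuming the standard litellm `Router(model_list=...)` constructor; the first-match strategy here is illustrative, not from the commit:

```python
from typing import Dict, List, Optional, Union

from litellm import Router
from litellm.types.router import CustomRoutingStrategy


class FirstMatchStrategy(CustomRoutingStrategy):
    """Toy strategy: return the first deployment whose model_name matches."""

    def __init__(self, model_list: List[Dict]):
        self.model_list = model_list

    async def async_get_available_deployment(
        self,
        model: str,
        messages: Optional[List[Dict[str, str]]] = None,
        input: Optional[Union[str, List]] = None,
        specific_deployment: Optional[bool] = False,
        request_kwargs: Optional[Dict] = None,
    ):
        # Reuse the synchronous logic; no awaiting needed for this toy picker.
        return self.get_available_deployment(
            model, messages, input, specific_deployment, request_kwargs
        )

    def get_available_deployment(
        self,
        model: str,
        messages: Optional[List[Dict[str, str]]] = None,
        input: Optional[Union[str, List]] = None,
        specific_deployment: Optional[bool] = False,
        request_kwargs: Optional[Dict] = None,
    ):
        for deployment in self.model_list:
            if deployment["model_name"] == model:
                return deployment


model_list = [
    {
        "model_name": "deepseek-coder",
        "litellm_params": {"model": "openrouter/deepseek/deepseek-coder"},
    }
]
router = Router(model_list=model_list)
router.set_custom_routing_strategy(FirstMatchStrategy(model_list))
```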