Merge pull request #3954 from BerriAI/litellm_simple_request_prioritization

feat(scheduler.py): add request prioritization scheduler
2024-05-31 23:29:09 -07:00 · 2024-05-31 23:29:09 -07:00 · 8375e9621c
commit 8375e9621c
parent 04f42d7e63 183dd81087
12 changed files with 612 additions and 149 deletions
--- a/litellm/types/router.py
+++ b/litellm/types/router.py
@@ -314,6 +314,8 @@ class LiteLLMParamsTypedDict(TypedDict, total=False):
    output_cost_per_token: Optional[float]
    input_cost_per_second: Optional[float]
    output_cost_per_second: Optional[float]
+    ## MOCK RESPONSES ##
+    mock_response: Optional[str]


 class DeploymentTypedDict(TypedDict):