fix(proxy_server.py): support setting tpm/rpm limits per user / per key

This commit is contained in:
Krrish Dholakia 2024-01-18 17:03:18 -08:00
parent 5dac2402ef
commit 1e5efdfa37
5 changed files with 26 additions and 3 deletions

View file

@@ -13,6 +13,9 @@ model LiteLLM_UserTable {
spend Float @default(0.0)
user_email String?
models String[]
max_parallel_requests Int?
tpm_limit BigInt?
rpm_limit BigInt?
}
// required for token gen
@@ -26,6 +29,8 @@ model LiteLLM_VerificationToken {
user_id String?
max_parallel_requests Int?
metadata Json @default("{}")
tpm_limit BigInt?
rpm_limit BigInt?
}
model LiteLLM_Config {