fix(proxy_server.py): support setting tpm/rpm limits per user / per key

2024-01-18 17:03:18 -08:00 · 2024-01-18 17:03:18 -08:00 · 1e5efdfa37
commit 1e5efdfa37
parent 5dac2402ef
5 changed files with 26 additions and 3 deletions
--- a/schema.prisma
+++ b/schema.prisma
@@ -13,6 +13,9 @@ model LiteLLM_UserTable {
    spend      Float    @default(0.0)
    user_email    String?
    models     String[]
+    max_parallel_requests Int?
+    tpm_limit     BigInt?
+    rpm_limit     BigInt?
 }

 // required for token gen
@@ -26,6 +29,8 @@ model LiteLLM_VerificationToken {
    user_id    String?
    max_parallel_requests Int?
    metadata   Json  @default("{}")
+    tpm_limit     BigInt?
+    rpm_limit     BigInt?
 }

 model LiteLLM_Config {