From f2d6aab8f527316ff4311bf8e0b1439885dcb3cb Mon Sep 17 00:00:00 2001 From: ishaan-jaff Date: Wed, 14 Feb 2024 17:23:25 -0800 Subject: [PATCH] (feat) proxy - use access groups --- litellm/proxy/proxy_config.yaml | 15 +++++---------- 1 file changed, 5 insertions(+), 10 deletions(-) diff --git a/litellm/proxy/proxy_config.yaml b/litellm/proxy/proxy_config.yaml index d94f987db..74a780c71 100644 --- a/litellm/proxy/proxy_config.yaml +++ b/litellm/proxy/proxy_config.yaml @@ -9,14 +9,19 @@ model_list: mode: chat max_tokens: 4096 base_model: azure/gpt-4-1106-preview + access_groups: ["public"] - model_name: openai-gpt-3.5 litellm_params: model: gpt-3.5-turbo api_key: os.environ/OPENAI_API_KEY + model_info: + access_groups: ["public"] - model_name: anthropic-claude-v2.1 litellm_params: model: bedrock/anthropic.claude-v2:1 timeout: 300 # sets a 5 minute timeout + model_info: + access_groups: ["private"] - model_name: anthropic-claude-v2 litellm_params: model: bedrock/anthropic.claude-v2 @@ -39,16 +44,6 @@ model_list: litellm_settings: fallbacks: [{"openai-gpt-3.5": ["azure-gpt-3.5"]}] success_callback: ['langfuse'] - max_budget: 50 # global budget for proxy - max_user_budget: 0.0001 - budget_duration: 30d # global budget duration, will reset after 30d - default_key_generate_params: - max_budget: 1.5000 - models: ["azure-gpt-3.5"] - duration: None - upperbound_key_generate_params: - max_budget: 100 - duration: "30d" # setting callback class # callbacks: custom_callbacks.proxy_handler_instance # sets litellm.callbacks = [proxy_handler_instance]