From a3baec081bd08c5aaa725050b8e872f1a9a78991 Mon Sep 17 00:00:00 2001 From: David Manouchehri Date: Fri, 8 Nov 2024 11:40:15 -0500 Subject: [PATCH] (pricing): Fix multiple mistakes in Claude pricing, and also increase context length allowed for Claude 3.5 Sonnet v2 on Bedrock. (#6666) --- ...odel_prices_and_context_window_backup.json | 28 +++++++++++-------- model_prices_and_context_window.json | 28 +++++++++++-------- 2 files changed, 32 insertions(+), 24 deletions(-) diff --git a/litellm/model_prices_and_context_window_backup.json b/litellm/model_prices_and_context_window_backup.json index cfc2cef72..a9c65b2c9 100644 --- a/litellm/model_prices_and_context_window_backup.json +++ b/litellm/model_prices_and_context_window_backup.json @@ -1886,11 +1886,13 @@ "supports_prompt_caching": true }, "claude-3-5-haiku-20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, + "cache_creation_input_token_cost": 0.00000125, + "cache_read_input_token_cost": 0.0000001, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, @@ -2812,9 +2814,9 @@ "supports_assistant_prefill": true }, "vertex_ai/claude-3-5-haiku@20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "vertex_ai-anthropic_models", @@ -3816,9 +3818,9 @@ "tool_use_system_prompt_tokens": 264 }, "openrouter/anthropic/claude-3-5-haiku-20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "openrouter", @@ -4529,9 +4531,9 @@ "supports_vision": true }, "anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", @@ -4559,6 +4561,7 @@ "output_cost_per_token": 0.000005, "litellm_provider": "bedrock", "mode": "chat", + "supports_assistant_prefill": true, "supports_function_calling": true }, "anthropic.claude-3-opus-20240229-v1:0": { @@ -4595,9 +4598,9 @@ "supports_vision": true }, "us.anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", @@ -4625,6 +4628,7 @@ "output_cost_per_token": 0.000005, "litellm_provider": "bedrock", "mode": "chat", + "supports_assistant_prefill": true, "supports_function_calling": true }, "us.anthropic.claude-3-opus-20240229-v1:0": { @@ -4661,9 +4665,9 @@ "supports_vision": true }, "eu.anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index cfc2cef72..a9c65b2c9 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -1886,11 +1886,13 @@ "supports_prompt_caching": true }, "claude-3-5-haiku-20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, + "cache_creation_input_token_cost": 0.00000125, + "cache_read_input_token_cost": 0.0000001, "litellm_provider": "anthropic", "mode": "chat", "supports_function_calling": true, @@ -2812,9 +2814,9 @@ "supports_assistant_prefill": true }, "vertex_ai/claude-3-5-haiku@20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "vertex_ai-anthropic_models", @@ -3816,9 +3818,9 @@ "tool_use_system_prompt_tokens": 264 }, "openrouter/anthropic/claude-3-5-haiku-20241022": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000001, "output_cost_per_token": 0.000005, "litellm_provider": "openrouter", @@ -4529,9 +4531,9 @@ "supports_vision": true }, "anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", @@ -4559,6 +4561,7 @@ "output_cost_per_token": 0.000005, "litellm_provider": "bedrock", "mode": "chat", + "supports_assistant_prefill": true, "supports_function_calling": true }, "anthropic.claude-3-opus-20240229-v1:0": { @@ -4595,9 +4598,9 @@ "supports_vision": true }, "us.anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock", @@ -4625,6 +4628,7 @@ "output_cost_per_token": 0.000005, "litellm_provider": "bedrock", "mode": "chat", + "supports_assistant_prefill": true, "supports_function_calling": true }, "us.anthropic.claude-3-opus-20240229-v1:0": { @@ -4661,9 +4665,9 @@ "supports_vision": true }, "eu.anthropic.claude-3-5-sonnet-20241022-v2:0": { - "max_tokens": 4096, + "max_tokens": 8192, "max_input_tokens": 200000, - "max_output_tokens": 4096, + "max_output_tokens": 8192, "input_cost_per_token": 0.000003, "output_cost_per_token": 0.000015, "litellm_provider": "bedrock",