diff --git a/litellm/model_prices_and_context_window_backup.json b/litellm/model_prices_and_context_window_backup.json index 6b2aee81ff..17e874d050 100644 --- a/litellm/model_prices_and_context_window_backup.json +++ b/litellm/model_prices_and_context_window_backup.json @@ -161,6 +161,30 @@ "search_context_size_high": 0.030 } }, + "gpt-4.1-mini-2025-04-14":{ + "max_input_tokens": 1014808, + "max_output_tokens": 32768, + "input_cost_per_token": 0.0000004, + "output_cost_per_token": 0.0000016, + "cache_read_input_token_cost": 0.0000001, + "input_cost_per_token_batches": 0.0000002, + "output_cost_per_token_batches": 0.0000008, + "litellm_provider": "openai", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_response_schema": true, + "supports_vision": true, + "supports_prompt_caching": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_web_search": true, + "search_context_cost_per_query": { + "search_context_size_low": 0.025, + "search_context_size_medium": 0.0275, + "search_context_size_high": 0.030 + } + }, "gpt-4.1-nano": { "max_input_tokens": 1014808, "max_output_tokens": 32768, @@ -185,6 +209,30 @@ "search_context_size_high": 0.030 } }, + "gpt-4.1-nano-2025-04-14": { + "max_input_tokens": 1014808, + "max_output_tokens": 32768, + "input_cost_per_token": 0.0000001, + "output_cost_per_token": 0.0000004, + "cache_read_input_token_cost": 0.000000025, + "input_cost_per_token_batches": 0.00000005, + "output_cost_per_token_batches": 0.00000020, + "litellm_provider": "openai", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_response_schema": true, + "supports_vision": true, + "supports_prompt_caching": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_web_search": true, + "search_context_cost_per_query": { + "search_context_size_low": 0.025, + "search_context_size_medium": 0.0275, + "search_context_size_high": 0.030 + } + }, "watsonx/ibm/granite-3-8b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192, diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index 6b2aee81ff..17e874d050 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -161,6 +161,30 @@ "search_context_size_high": 0.030 } }, + "gpt-4.1-mini-2025-04-14":{ + "max_input_tokens": 1014808, + "max_output_tokens": 32768, + "input_cost_per_token": 0.0000004, + "output_cost_per_token": 0.0000016, + "cache_read_input_token_cost": 0.0000001, + "input_cost_per_token_batches": 0.0000002, + "output_cost_per_token_batches": 0.0000008, + "litellm_provider": "openai", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_response_schema": true, + "supports_vision": true, + "supports_prompt_caching": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_web_search": true, + "search_context_cost_per_query": { + "search_context_size_low": 0.025, + "search_context_size_medium": 0.0275, + "search_context_size_high": 0.030 + } + }, "gpt-4.1-nano": { "max_input_tokens": 1014808, "max_output_tokens": 32768, @@ -185,6 +209,30 @@ "search_context_size_high": 0.030 } }, + "gpt-4.1-nano-2025-04-14": { + "max_input_tokens": 1014808, + "max_output_tokens": 32768, + "input_cost_per_token": 0.0000001, + "output_cost_per_token": 0.0000004, + "cache_read_input_token_cost": 0.000000025, + "input_cost_per_token_batches": 0.00000005, + "output_cost_per_token_batches": 0.00000020, + "litellm_provider": "openai", + "mode": "chat", + "supports_function_calling": true, + "supports_parallel_function_calling": true, + "supports_response_schema": true, + "supports_vision": true, + "supports_prompt_caching": true, + "supports_system_messages": true, + "supports_tool_choice": true, + "supports_web_search": true, + "search_context_cost_per_query": { + "search_context_size_low": 0.025, + "search_context_size_medium": 0.0275, + "search_context_size_high": 0.030 + } + }, "watsonx/ibm/granite-3-8b-instruct": { "max_tokens": 8192, "max_input_tokens": 8192,