From 5bc5eaff8a28a1c452bf61e0f3d8f802b7f3e28b Mon Sep 17 00:00:00 2001 From: Krrish Dholakia Date: Wed, 25 Sep 2024 21:50:25 -0700 Subject: [PATCH] build(model_prices_and_context_window.json): add new gemini - google ai studio models Closes https://github.com/BerriAI/litellm/pull/5879#issuecomment-2375703347 --- ...odel_prices_and_context_window_backup.json | 71 +++++++++++++++++-- model_prices_and_context_window.json | 71 +++++++++++++++++-- 2 files changed, 134 insertions(+), 8 deletions(-) diff --git a/litellm/model_prices_and_context_window_backup.json b/litellm/model_prices_and_context_window_backup.json index e6707903c..0cd996289 100644 --- a/litellm/model_prices_and_context_window_backup.json +++ b/litellm/model_prices_and_context_window_backup.json @@ -2708,9 +2708,32 @@ "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, + "gemini/gemini-1.5-flash-002": { + "max_tokens": 8192, + "max_input_tokens": 1048576, + "max_output_tokens": 8192, + "max_images_per_prompt": 3000, + "max_videos_per_prompt": 10, + "max_video_length": 1, + "max_audio_length_hours": 8.4, + "max_audio_per_prompt": 1, + "max_pdf_size_mb": 30, + "input_cost_per_token": 0.000000075, + "input_cost_per_token_above_128k_tokens": 0.00000015, + "output_cost_per_token": 0.0000003, + "output_cost_per_token_above_128k_tokens": 0.0000006, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_response_schema": true, + "supports_prompt_caching": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-flash-001": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2733,7 +2756,7 @@ }, "gemini/gemini-1.5-flash": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2755,7 +2778,7 @@ }, "gemini/gemini-1.5-flash-latest": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2775,9 +2798,31 @@ "supports_response_schema": true, "source": "https://ai.google.dev/pricing" }, + "gemini/gemini-1.5-flash-8b-exp-0924": { + "max_tokens": 8192, + "max_input_tokens": 1048576, + "max_output_tokens": 8192, + "max_images_per_prompt": 3000, + "max_videos_per_prompt": 10, + "max_video_length": 1, + "max_audio_length_hours": 8.4, + "max_audio_per_prompt": 1, + "max_pdf_size_mb": 30, + "input_cost_per_token": 0, + "input_cost_per_token_above_128k_tokens": 0, + "output_cost_per_token": 0, + "output_cost_per_token_above_128k_tokens": 0, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_response_schema": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-flash-exp-0827": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2848,6 +2893,24 @@ "supports_response_schema": true, "source": "https://ai.google.dev/pricing" }, + "gemini/gemini-1.5-pro-002": { + "max_tokens": 8192, + "max_input_tokens": 2097152, + "max_output_tokens": 8192, + "input_cost_per_token": 0.0000035, + "input_cost_per_token_above_128k_tokens": 0.000007, + "output_cost_per_token": 0.0000105, + "output_cost_per_token_above_128k_tokens": 0.000021, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-pro-001": { "max_tokens": 8192, "max_input_tokens": 2097152, diff --git a/model_prices_and_context_window.json b/model_prices_and_context_window.json index ba664d2b2..e801788ad 100644 --- a/model_prices_and_context_window.json +++ b/model_prices_and_context_window.json @@ -2719,9 +2719,32 @@ "mode": "completion", "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#foundation_models" }, + "gemini/gemini-1.5-flash-002": { + "max_tokens": 8192, + "max_input_tokens": 1048576, + "max_output_tokens": 8192, + "max_images_per_prompt": 3000, + "max_videos_per_prompt": 10, + "max_video_length": 1, + "max_audio_length_hours": 8.4, + "max_audio_per_prompt": 1, + "max_pdf_size_mb": 30, + "input_cost_per_token": 0.000000075, + "input_cost_per_token_above_128k_tokens": 0.00000015, + "output_cost_per_token": 0.0000003, + "output_cost_per_token_above_128k_tokens": 0.0000006, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_response_schema": true, + "supports_prompt_caching": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-flash-001": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2744,7 +2767,7 @@ }, "gemini/gemini-1.5-flash": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2766,7 +2789,7 @@ }, "gemini/gemini-1.5-flash-latest": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2786,9 +2809,31 @@ "supports_response_schema": true, "source": "https://ai.google.dev/pricing" }, + "gemini/gemini-1.5-flash-8b-exp-0924": { + "max_tokens": 8192, + "max_input_tokens": 1048576, + "max_output_tokens": 8192, + "max_images_per_prompt": 3000, + "max_videos_per_prompt": 10, + "max_video_length": 1, + "max_audio_length_hours": 8.4, + "max_audio_per_prompt": 1, + "max_pdf_size_mb": 30, + "input_cost_per_token": 0, + "input_cost_per_token_above_128k_tokens": 0, + "output_cost_per_token": 0, + "output_cost_per_token_above_128k_tokens": 0, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_response_schema": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-flash-exp-0827": { "max_tokens": 8192, - "max_input_tokens": 1000000, + "max_input_tokens": 1048576, "max_output_tokens": 8192, "max_images_per_prompt": 3000, "max_videos_per_prompt": 10, @@ -2859,6 +2904,24 @@ "supports_response_schema": true, "source": "https://ai.google.dev/pricing" }, + "gemini/gemini-1.5-pro-002": { + "max_tokens": 8192, + "max_input_tokens": 2097152, + "max_output_tokens": 8192, + "input_cost_per_token": 0.0000035, + "input_cost_per_token_above_128k_tokens": 0.000007, + "output_cost_per_token": 0.0000105, + "output_cost_per_token_above_128k_tokens": 0.000021, + "litellm_provider": "gemini", + "mode": "chat", + "supports_system_messages": true, + "supports_function_calling": true, + "supports_vision": true, + "supports_tool_choice": true, + "supports_response_schema": true, + "supports_prompt_caching": true, + "source": "https://ai.google.dev/pricing" + }, "gemini/gemini-1.5-pro-001": { "max_tokens": 8192, "max_input_tokens": 2097152,