Add gemini-2.0-flash pricing + model info (#8303)

* add gemini-2.0-flash-001 (#8289)

* build(model_prices_and_context_window.json): add gemini-2.0-flash-001 to model cost map

Adds new gemini model with token-based pricing to model cost map

---------

Co-authored-by: kushagro <kush@orby.ai>
2025-04-24 18:24:20 +00:00 · 2025-02-05 20:49:26 -08:00 · 2025-02-05 20:49:26 -08:00 · bcfa641b81
commit bcfa641b81
parent 5e921804b9
2 changed files with 46 additions and 2 deletions
--- a/litellm/model_prices_and_context_window_backup.json
+++ b/litellm/model_prices_and_context_window_backup.json
@@ -3449,7 +3449,6 @@
        "supports_response_schema": true,
        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-1.5-flash",
        "deprecation_date": "2025-09-24",
-        "deprecation_date": "2025-09-24",
        "supports_tool_choice": true
    },
    "gemini-1.5-flash-001": {
@@ -3654,6 +3653,29 @@
        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash",
        "supports_tool_choice": true
    },
+    "gemini-2.0-flash-001": {
+        "max_tokens": 8192,
+        "max_input_tokens": 1048576,
+        "max_output_tokens": 8192,
+        "max_images_per_prompt": 3000,
+        "max_videos_per_prompt": 10,
+        "max_video_length": 1,
+        "max_audio_length_hours": 8.4,
+        "max_audio_per_prompt": 1,
+        "max_pdf_size_mb": 30,
+        "input_cost_per_audio_token": 0.000001,
+        "input_cost_per_token": 0.00000015,
+        "output_cost_per_token": 0.0000006,
+        "litellm_provider": "vertex_ai-language-models",
+        "mode": "chat",
+        "supports_system_messages": true,
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "supports_response_schema": true,
+        "supports_audio_output": true,
+        "supports_tool_choice": true,
+        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash"
+    },
    "gemini-2.0-flash-thinking-exp": {
        "max_tokens": 8192,
        "max_input_tokens": 1048576,
--- a/model_prices_and_context_window.json
+++ b/model_prices_and_context_window.json
@@ -3449,7 +3449,6 @@
        "supports_response_schema": true,
        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-1.5-flash",
        "deprecation_date": "2025-09-24",
-        "deprecation_date": "2025-09-24",
        "supports_tool_choice": true
    },
    "gemini-1.5-flash-001": {
@@ -3654,6 +3653,29 @@
        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash",
        "supports_tool_choice": true
    },
+    "gemini-2.0-flash-001": {
+        "max_tokens": 8192,
+        "max_input_tokens": 1048576,
+        "max_output_tokens": 8192,
+        "max_images_per_prompt": 3000,
+        "max_videos_per_prompt": 10,
+        "max_video_length": 1,
+        "max_audio_length_hours": 8.4,
+        "max_audio_per_prompt": 1,
+        "max_pdf_size_mb": 30,
+        "input_cost_per_audio_token": 0.000001,
+        "input_cost_per_token": 0.00000015,
+        "output_cost_per_token": 0.0000006,
+        "litellm_provider": "vertex_ai-language-models",
+        "mode": "chat",
+        "supports_system_messages": true,
+        "supports_function_calling": true,
+        "supports_vision": true,
+        "supports_response_schema": true,
+        "supports_audio_output": true,
+        "supports_tool_choice": true,
+        "source": "https://cloud.google.com/vertex-ai/generative-ai/docs/learn/models#gemini-2.0-flash"
+    },
    "gemini-2.0-flash-thinking-exp": {
        "max_tokens": 8192,
        "max_input_tokens": 1048576,