Cost tracking for gemini-2.5-pro (#9837)

* build(model_prices_and_context_window.json): add google/gemini-2.0-flash-lite-001 versioned pricing Closes https://github.com/BerriAI/litellm/issues/9829
* build(model_prices_and_context_window.json): add initial support for 'supported_output_modalities' param
* build(model_prices_and_context_window.json): add initial support for 'supported_output_modalities' param
* build(model_prices_and_context_window.json): add supported endpoints to gemini-2.5-pro
* build(model_prices_and_context_window.json): add gemini 200k+ pricing
* feat(utils.py): support cost calculation for gemini-2.5-pro above 200k tokens Fixes https://github.com/BerriAI/litellm/issues/9807
* build: test dockerfile change
* build: revert apk change
* ci(config.yml): pip install wheel
* ci: test problematic package first
* ci(config.yml): pip install only binary
* ci: try more things
* ci: test different ml_dtypes version
* ci(config.yml): check ml_dtypes==0.4.0
* ci: test
* ci: cleanup config.yml
* ci: specify ml dtypes in requirements.txt
* ci: remove redisvl dependency (temporary)
* fix: fix linting errors
* test: update test
* test: fix test
2025-04-26 03:04:13 +00:00 · 2025-04-09 18:48:43 -07:00 · 2025-04-09 18:48:43 -07:00 · ac4f32fb1e
commit ac4f32fb1e
parent 4c1bb74c3d
10 changed files with 251 additions and 91 deletions
--- a/tests/local_testing/test_get_model_info.py
+++ b/tests/local_testing/test_get_model_info.py
@@ -431,6 +431,7 @@ def test_aaamodel_prices_and_context_window_json_is_valid():
                "input_cost_per_character_above_128k_tokens": {"type": "number"},
                "input_cost_per_image": {"type": "number"},
                "input_cost_per_image_above_128k_tokens": {"type": "number"},
+                "input_cost_per_token_above_200k_tokens": {"type": "number"},
                "input_cost_per_pixel": {"type": "number"},
                "input_cost_per_query": {"type": "number"},
                "input_cost_per_request": {"type": "number"},
@@ -483,6 +484,7 @@ def test_aaamodel_prices_and_context_window_json_is_valid():
                "output_cost_per_second": {"type": "number"},
                "output_cost_per_token": {"type": "number"},
                "output_cost_per_token_above_128k_tokens": {"type": "number"},
+                "output_cost_per_token_above_200k_tokens": {"type": "number"},
                "output_cost_per_token_batches": {"type": "number"},
                "output_db_cost_per_token": {"type": "number"},
                "output_dbu_cost_per_token": {"type": "number"},
@@ -541,6 +543,13 @@ def test_aaamodel_prices_and_context_window_json_is_valid():
                        "enum": ["text", "audio", "image", "video"],
                    },
                },
+                "supported_output_modalities": {
+                    "type": "array",
+                    "items": {
+                        "type": "string",
+                        "enum": ["text", "image"],
+                    },
+                },
                "supports_native_streaming": {"type": "boolean"},
            },
            "additionalProperties": False,