Fix completion_tokens on Vertex AI Gemini thinking models

2025-04-25 02:34:29 +00:00 · 2025-04-21 08:57:12 -05:00 · 2025-04-21 08:57:12 -05:00 · f87f500a49
commit f87f500a49
parent 62ed5b2f78
1 changed file with 9 additions and 3 deletions
--- a/litellm/llms/vertex_ai/gemini/vertex_and_google_ai_studio_gemini.py
+++ b/litellm/llms/vertex_ai/gemini/vertex_and_google_ai_studio_gemini.py
@@ -766,14 +766,20 @@ class VertexGeminiConfig(VertexAIBaseConfig, BaseConfig):
            audio_tokens=audio_tokens,
            text_tokens=text_tokens,
        )
+        completion_tokens = completion_response["usageMetadata"].get(
+            "candidatesTokenCount", 0
+        )
+        if reasoning_tokens:
+            # The Usage(...) constructor expects completion_tokens to include reasoning_tokens.
+            # However, the Vertex AI usage metadata does not include reasoning tokens in candidatesTokenCount.
+            # Reportedly, this differs from the Gemini API.
+            completion_tokens += reasoning_tokens
        ## GET USAGE ##
        usage = Usage(
            prompt_tokens=completion_response["usageMetadata"].get(
                "promptTokenCount", 0
            ),
-            completion_tokens=completion_response["usageMetadata"].get(
-                "candidatesTokenCount", 0
-            ),
+            completion_tokens=completion_tokens,
            total_tokens=completion_response["usageMetadata"].get("totalTokenCount", 0),
            prompt_tokens_details=prompt_tokens_details,
            reasoning_tokens=reasoning_tokens,