fix(o_series_transformation.py): fix optional param check for o-series models (#8787)

* fix(o_series_transformation.py): fix optional param check for o-series models
  o3-mini and o1 do not support parallel tool calling.
* fix(utils.py): support 'drop_params' for the 'thinking' param across models
  Allows switching to older Claude versions (or non-Anthropic models) with the param safely dropped.
* fix: fix passing thinking param in optional params
  Allows dropping the thinking param where it is not applicable.
* test: update old model
* fix(utils.py): fix linting errors
* fix(main.py): add param to acompletion
2025-04-25 02:34:29 +00:00 · 2025-02-26 12:26:55 -08:00 · 2025-02-26 12:26:55 -08:00 · 017c482d7b
commit 017c482d7b
parent aabb5c0df4
11 changed files with 87 additions and 31 deletions
--- a/litellm/main.py
+++ b/litellm/main.py
@@ -166,6 +166,7 @@ from .llms.vertex_ai.vertex_model_garden.main import VertexAIModelGardenModels
 from .llms.vllm.completion import handler as vllm_handler
 from .llms.watsonx.chat.handler import WatsonXChatHandler
 from .llms.watsonx.common_utils import IBMWatsonXMixin
+from .types.llms.anthropic import AnthropicThinkingParam
 from .types.llms.openai import (
    ChatCompletionAssistantMessage,
    ChatCompletionAudioParam,
@@ -341,6 +342,7 @@ async def acompletion(
    model_list: Optional[list] = None,  # pass in a list of api_base,keys, etc.
    extra_headers: Optional[dict] = None,
    # Optional liteLLM function params
+    thinking: Optional[AnthropicThinkingParam] = None,
    **kwargs,
 ) -> Union[ModelResponse, CustomStreamWrapper]:
    """
@@ -800,6 +802,7 @@ def completion(  # type: ignore # noqa: PLR0915
    api_key: Optional[str] = None,
    model_list: Optional[list] = None,  # pass in a list of api_base,keys, etc.
    # Optional liteLLM function params
+    thinking: Optional[AnthropicThinkingParam] = None,
    **kwargs,
 ) -> Union[ModelResponse, CustomStreamWrapper]:
    """
@@ -1106,6 +1109,7 @@ def completion(  # type: ignore # noqa: PLR0915
            parallel_tool_calls=parallel_tool_calls,
            messages=messages,
            reasoning_effort=reasoning_effort,
+            thinking=thinking,
            **non_default_params,
        )