Litellm dev 01 06 2025 p1 (#7594)

* fix(custom_logger.py): expose new 'async_get_chat_completion_prompt' event hook

* fix(custom_logger.py, langfuse_prompt_management.py): remove 'headers' from the custom logger 'async_get_chat_completion_prompt' and 'get_chat_completion_prompt' event hooks
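
A hypothetical sketch of what a prompt-management integration can now implement. The hook name comes from this commit; the parameter list is inferred from the call site in the diff below (model, messages, non_default_params, prompt_id, prompt_variables), and the return shape is an assumption rather than a documented contract:

```python
from typing import List, Optional, Tuple

from litellm.integrations.custom_logger import CustomLogger


class MyPromptManager(CustomLogger):
    async def async_get_chat_completion_prompt(
        self,
        model: str,
        messages: List[dict],
        non_default_params: dict,
        prompt_id: str,
        prompt_variables: Optional[dict],
        **kwargs,  # tolerate any extra keyword args the framework may pass
    ) -> Tuple[str, List[dict], dict]:
        # Sketch: look up a prompt template by prompt_id, render it with
        # prompt_variables, and return (model, messages, optional_params).
        rendered = [
            {"role": "user", "content": f"template for {prompt_id}: {prompt_variables}"}
        ]
        return model, rendered, non_default_params
```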

* feat(router.py): expose new function for prompt management based routing

* feat(router.py): partially working router prompt factory logic

allows a load-balanced model group to be used as the model name in a Langfuse prompt management call

* feat(router.py): fix prompt management with load balanced model group
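
A hedged usage sketch of router-based prompt management. The model group name, deployments, prompt id, and variables are illustrative; it also assumes Langfuse credentials are configured via environment variables and that the Langfuse integration is enabled through litellm.callbacks:

```python
import litellm
from litellm import Router

litellm.callbacks = ["langfuse"]  # assumed way to enable the Langfuse integration

# Two example deployments behind a single load-balanced model group name.
router = Router(
    model_list=[
        {
            "model_name": "gpt-4o-group",  # illustrative group name
            "litellm_params": {"model": "openai/gpt-4o"},
        },
        {
            "model_name": "gpt-4o-group",
            "litellm_params": {"model": "azure/gpt-4o", "api_base": "https://..."},
        },
    ]
)

# The router resolves "gpt-4o-group" to a concrete deployment, while the
# prompt text itself is fetched from Langfuse via prompt_id.
response = router.completion(
    model="gpt-4o-group",
    messages=[{"role": "user", "content": "fallback message"}],
    prompt_id="my-langfuse-prompt",         # illustrative prompt id
    prompt_variables={"customer": "Acme"},  # illustrative variables
)
```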

* feat(langfuse_prompt_management.py): support reading in openai params from langfuse

enables the user to define optional params in Langfuse instead of in client code
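
Presumably, optional params stored with the Langfuse prompt (e.g. temperature or max_tokens in the prompt's config) are merged into the request, so the client call can omit them. A sketch under that assumption; the config field names are guesses, not the integration's documented schema:

```python
import litellm

litellm.callbacks = ["langfuse"]  # assumed way to enable the Langfuse integration

# Hypothetical: the Langfuse prompt "my-langfuse-prompt" was saved with a config
# such as {"temperature": 0.2, "max_tokens": 256}. If the integration reads those
# values, they no longer need to appear in client code.
response = litellm.completion(
    model="gpt-4o",
    messages=[{"role": "user", "content": "fallback message"}],
    prompt_id="my-langfuse-prompt",
    prompt_variables={"customer": "Acme"},
    # no temperature / max_tokens here; they come from the Langfuse prompt config
)
```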

* test(test_Router.py): add unit test for router-based Langfuse prompt management
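
A rough idea of such a test. The name, structure, and assertions are illustrative guesses, not the test added in this commit; mock_response keeps the call offline:

```python
import pytest

from litellm import Router


@pytest.mark.asyncio
async def test_router_langfuse_prompt_management():
    # Illustrative: a single mocked deployment behind a model group name.
    router = Router(
        model_list=[
            {
                "model_name": "my-group",
                "litellm_params": {"model": "openai/gpt-4o", "mock_response": "hi"},
            }
        ]
    )

    response = await router.acompletion(
        model="my-group",
        messages=[{"role": "user", "content": "hello"}],
        prompt_id="example-prompt",          # hypothetical prompt id
        prompt_variables={"name": "world"},  # hypothetical variables
    )

    assert response.choices[0].message.content == "hi"
```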

* fix: fix linting errors
Author: Krish Dholakia (committed by GitHub), 2025-01-06 21:26:21 -08:00
Parent: 7133cf5b74
Commit: fef7839e8a
9 changed files with 214 additions and 90 deletions

Excerpt of the diff from one of the changed files:

@@ -79,6 +79,7 @@ from litellm.utils import (
     create_tokenizer,
     get_api_key,
     get_llm_provider,
+    get_non_default_completion_params,
     get_optional_params_embeddings,
     get_optional_params_image_gen,
     get_optional_params_transcription,
@@ -881,12 +882,8 @@ def completion( # type: ignore # noqa: PLR0915
         assistant_continue_message=assistant_continue_message,
     )
     ######## end of unpacking kwargs ###########
-    openai_params = litellm.OPENAI_CHAT_COMPLETION_PARAMS
-    default_params = openai_params + all_litellm_params
+    non_default_params = get_non_default_completion_params(kwargs=kwargs)
     litellm_params = {} # used to prevent unbound var errors
-    non_default_params = {
-        k: v for k, v in kwargs.items() if k not in default_params
-    } # model-specific params - pass them straight to the model/provider
 
     ## PROMPT MANAGEMENT HOOKS ##
     if isinstance(litellm_logging_obj, LiteLLMLoggingObj) and prompt_id is not None:
@@ -895,7 +892,6 @@
             model=model,
             messages=messages,
             non_default_params=non_default_params,
-            headers=headers,
             prompt_id=prompt_id,
             prompt_variables=prompt_variables,
         )
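
The inline logic removed above suggests what the new get_non_default_completion_params helper does: strip out every kwarg that is a standard OpenAI chat-completion param or an internal LiteLLM param, leaving only model/provider-specific ones. A rough equivalent, with the LiteLLM param list passed in explicitly because the helper's real imports are not shown in this excerpt:

```python
import litellm


def get_non_default_completion_params(kwargs: dict, all_litellm_params: list) -> dict:
    """Sketch of the helper's behavior: keep only kwargs that are neither
    OpenAI chat-completion params nor LiteLLM-internal params; these are
    forwarded to the model/provider untouched."""
    default_params = litellm.OPENAI_CHAT_COMPLETION_PARAMS + all_litellm_params
    return {k: v for k, v in kwargs.items() if k not in default_params}
```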