fixes and linting

2026-01-07 01:19:56 +00:00 · 2025-03-28 18:33:36 -07:00 · 2025-03-28 18:33:36 -07:00 · 5251d2422d
commit 5251d2422d
parent 021dd0d35d
8 changed files with 149 additions and 345 deletions
--- a/llama_stack/providers/utils/inference/prompt_adapter.py
+++ b/llama_stack/providers/utils/inference/prompt_adapter.py
@@ -12,6 +12,7 @@ import re
 from typing import List, Optional, Tuple, Union

 import httpx
+from PIL import Image as PIL_Image

 from llama_stack.apis.common.content_types import (
    ImageContentItem,
@@ -33,7 +34,6 @@ from llama_stack.apis.inference import (
 )
 from llama_stack.log import get_logger
 from llama_stack.models.llama.datatypes import (
-    is_multimodal,
    ModelFamily,
    RawContent,
    RawContentItem,
@@ -43,6 +43,7 @@ from llama_stack.models.llama.datatypes import (
    Role,
    StopReason,
    ToolPromptFormat,
+    is_multimodal,
 )
 from llama_stack.models.llama.llama3.chat_format import ChatFormat
 from llama_stack.models.llama.llama3.prompt_templates import (
@@ -55,7 +56,6 @@ from llama_stack.models.llama.llama3.prompt_templates import (
 from llama_stack.models.llama.llama3.tokenizer import Tokenizer
 from llama_stack.models.llama.sku_list import resolve_model
 from llama_stack.providers.utils.inference import supported_inference_models
-from PIL import Image as PIL_Image

 log = get_logger(name=__name__, category="inference")

@@ -129,9 +129,7 @@ async def interleaved_content_convert_to_raw(
                if image.url.uri.startswith("data"):
                    match = re.match(r"data:image/(\w+);base64,(.+)", image.url.uri)
                    if not match:
-                        raise ValueError(
-                            f"Invalid data URL format, {image.url.uri[:40]}..."
-                        )
+                        raise ValueError(f"Invalid data URL format, {image.url.uri[:40]}...")
                    _, image_data = match.groups()
                    data = base64.b64decode(image_data)
                elif image.url.uri.startswith("file://"):
@@ -211,17 +209,13 @@ async def convert_image_content_to_url(

    content, format = await localize_image_content(media)
    if include_format:
-        return f"data:image/{format};base64," + base64.b64encode(content).decode(
-            "utf-8"
-        )
+        return f"data:image/{format};base64," + base64.b64encode(content).decode("utf-8")
    else:
        return base64.b64encode(content).decode("utf-8")


 async def completion_request_to_prompt(request: CompletionRequest) -> str:
-    content = augment_content_with_response_format_prompt(
-        request.response_format, request.content
-    )
+    content = augment_content_with_response_format_prompt(request.response_format, request.content)
    request.content = content
    request = await convert_request_to_raw(request)

@@ -233,9 +227,7 @@ async def completion_request_to_prompt(request: CompletionRequest) -> str:
 async def completion_request_to_prompt_model_input_info(
    request: CompletionRequest,
 ) -> Tuple[str, int]:
-    content = augment_content_with_response_format_prompt(
-        request.response_format, request.content
-    )
+    content = augment_content_with_response_format_prompt(request.response_format, request.content)
    request.content = content
    request = await convert_request_to_raw(request)

@@ -256,9 +248,7 @@ def augment_content_with_response_format_prompt(response_format, content):
    return content


-async def chat_completion_request_to_prompt(
-    request: ChatCompletionRequest, llama_model: str
-) -> str:
+async def chat_completion_request_to_prompt(request: ChatCompletionRequest, llama_model: str) -> str:
    messages = chat_completion_request_to_messages(request, llama_model)
    request.messages = messages
    request = await convert_request_to_raw(request)
@@ -266,8 +256,7 @@ async def chat_completion_request_to_prompt(
    formatter = ChatFormat(tokenizer=Tokenizer.get_instance())
    model_input = formatter.encode_dialog_prompt(
        request.messages,
-        tool_prompt_format=request.tool_config.tool_prompt_format
-        or get_default_tool_prompt_format(llama_model),
+        tool_prompt_format=request.tool_config.tool_prompt_format or get_default_tool_prompt_format(llama_model),
    )
    return formatter.tokenizer.decode(model_input.tokens)

@@ -282,8 +271,7 @@ async def chat_completion_request_to_model_input_info(
    formatter = ChatFormat(tokenizer=Tokenizer.get_instance())
    model_input = formatter.encode_dialog_prompt(
        request.messages,
-        tool_prompt_format=request.tool_config.tool_prompt_format
-        or get_default_tool_prompt_format(llama_model),
+        tool_prompt_format=request.tool_config.tool_prompt_format or get_default_tool_prompt_format(llama_model),
    )
    tokens = []
    for t in model_input.tokens:
@@ -318,8 +306,7 @@ def chat_completion_request_to_messages(
        return request.messages

    if model.model_family == ModelFamily.llama3_1 or (
-        model.model_family == ModelFamily.llama3_2
-        and is_multimodal(model.core_model_id)
+        model.model_family == ModelFamily.llama3_2 and is_multimodal(model.core_model_id)
    ):
        # llama3.1 and llama3.2 multimodal models follow the same tool prompt format
        messages = augment_messages_for_tools_llama_3_1(request)
@@ -355,9 +342,7 @@ def augment_messages_for_tools_llama_3_1(
    if existing_messages[0].role == Role.system.value:
        existing_system_message = existing_messages.pop(0)

-    assert (
-        existing_messages[0].role != Role.system.value
-    ), "Should only have 1 system message"
+    assert existing_messages[0].role != Role.system.value, "Should only have 1 system message"

    messages = []

@@ -389,13 +374,9 @@ def augment_messages_for_tools_llama_3_1(
        if isinstance(existing_system_message.content, str):
            sys_content += _process(existing_system_message.content)
        elif isinstance(existing_system_message.content, list):
-            sys_content += "\n".join(
-                [_process(c) for c in existing_system_message.content]
-            )
+            sys_content += "\n".join([_process(c) for c in existing_system_message.content])

-    tool_choice_prompt = _get_tool_choice_prompt(
-        request.tool_config.tool_choice, request.tools
-    )
+    tool_choice_prompt = _get_tool_choice_prompt(request.tool_config.tool_choice, request.tools)
    if tool_choice_prompt:
        sys_content += "\n" + tool_choice_prompt

@@ -429,9 +410,7 @@ def augment_messages_for_tools_llama_3_2(
    if existing_messages[0].role == Role.system.value:
        existing_system_message = existing_messages.pop(0)

-    assert (
-        existing_messages[0].role != Role.system.value
-    ), "Should only have 1 system message"
+    assert existing_messages[0].role != Role.system.value, "Should only have 1 system message"

    sys_content = ""
    custom_tools, builtin_tools = [], []
@@ -452,16 +431,10 @@ def augment_messages_for_tools_llama_3_2(
    if custom_tools:
        fmt = request.tool_config.tool_prompt_format or ToolPromptFormat.python_list
        if fmt != ToolPromptFormat.python_list:
-            raise ValueError(
-                f"Non supported ToolPromptFormat {request.tool_config.tool_prompt_format}"
-            )
+            raise ValueError(f"Non supported ToolPromptFormat {request.tool_config.tool_prompt_format}")

        system_prompt = None
-        if (
-            existing_system_message
-            and request.tool_config.system_message_behavior
-            == SystemMessageBehavior.replace
-        ):
+        if existing_system_message and request.tool_config.system_message_behavior == SystemMessageBehavior.replace:
            system_prompt = existing_system_message.content

        tool_template = PythonListCustomToolGenerator().gen(custom_tools, system_prompt)
@@ -470,16 +443,11 @@ def augment_messages_for_tools_llama_3_2(
        sys_content += "\n"

    if existing_system_message and (
-        request.tool_config.system_message_behavior == SystemMessageBehavior.append
-        or not custom_tools
+        request.tool_config.system_message_behavior == SystemMessageBehavior.append or not custom_tools
    ):
-        sys_content += interleaved_content_as_str(
-            existing_system_message.content, sep="\n"
-        )
+        sys_content += interleaved_content_as_str(existing_system_message.content, sep="\n")

-    tool_choice_prompt = _get_tool_choice_prompt(
-        request.tool_config.tool_choice, request.tools
-    )
+    tool_choice_prompt = _get_tool_choice_prompt(request.tool_config.tool_choice, request.tools)
    if tool_choice_prompt:
        sys_content += "\n" + tool_choice_prompt

@@ -487,15 +455,11 @@ def augment_messages_for_tools_llama_3_2(
    return messages


-def _get_tool_choice_prompt(
-    tool_choice: ToolChoice | str, tools: List[ToolDefinition]
-) -> str:
+def _get_tool_choice_prompt(tool_choice: ToolChoice | str, tools: List[ToolDefinition]) -> str:
    if tool_choice == ToolChoice.auto:
        return ""
    elif tool_choice == ToolChoice.required:
-        return (
-            "You MUST use one of the provided functions/tools to answer the user query."
-        )
+        return "You MUST use one of the provided functions/tools to answer the user query."
    elif tool_choice == ToolChoice.none:
        # tools are already not passed in
        return ""
@@ -507,14 +471,11 @@ def _get_tool_choice_prompt(
 def get_default_tool_prompt_format(model: str) -> ToolPromptFormat:
    llama_model = resolve_model(model)
    if llama_model is None:
-        log.warning(
-            f"Could not resolve model {model}, defaulting to json tool prompt format"
-        )
+        log.warning(f"Could not resolve model {model}, defaulting to json tool prompt format")
        return ToolPromptFormat.json

    if llama_model.model_family == ModelFamily.llama3_1 or (
-        llama_model.model_family == ModelFamily.llama3_2
-        and is_multimodal(llama_model.core_model_id)
+        llama_model.model_family == ModelFamily.llama3_2 and is_multimodal(llama_model.core_model_id)
    ):
        # llama3.1 and llama3.2 multimodal models follow the same tool prompt format
        return ToolPromptFormat.json