Support for Llama3.2 models and Swift SDK (#98)

2025-12-04 02:03:44 +00:00 · 2024-09-25 10:29:58 -07:00 · 2024-09-25 10:29:58 -07:00 · 56aed59eb4
commit 56aed59eb4
parent 95abbf576b
56 changed files with 3745 additions and 630 deletions
--- a/llama_stack/cli/model/model.py
+++ b/llama_stack/cli/model/model.py
@ -9,7 +9,7 @@ import argparse
 from llama_stack.cli.model.describe import ModelDescribe
 from llama_stack.cli.model.download import ModelDownload
 from llama_stack.cli.model.list import ModelList
-from llama_stack.cli.model.template import ModelTemplate
+from llama_stack.cli.model.prompt_format import ModelPromptFormat

 from llama_stack.cli.subcommand import Subcommand

@ -30,5 +30,5 @@ class ModelParser(Subcommand):
        # Add sub-commands
        ModelDownload.create(subparsers)
        ModelList.create(subparsers)
-        ModelTemplate.create(subparsers)
+        ModelPromptFormat.create(subparsers)
        ModelDescribe.create(subparsers)
--- a/llama_stack/cli/model/prompt_format.py
+++ b/llama_stack/cli/model/prompt_format.py
@ -0,0 +1,116 @@
+# Copyright (c) Meta Platforms, Inc. and affiliates.
+# All rights reserved.
+#
+# This source code is licensed under the terms described in the LICENSE file in
+# the root directory of this source tree.
+
+import argparse
+import subprocess
+import textwrap
+from io import StringIO
+
+from llama_models.datatypes import CoreModelId, is_multimodal, model_family, ModelFamily
+
+from llama_stack.cli.subcommand import Subcommand
+
+
+class ModelPromptFormat(Subcommand):
+    """CLI sub-command that shows the prompt (message) format of a Llama model.
+
+    Registers ``llama model prompt-format`` on the given sub-parsers object.
+    When invoked, it reads the prompt-format markdown packaged with
+    ``llama_models`` for the requested model and shows it through a pager.
+    """
+
+    def __init__(self, subparsers: argparse._SubParsersAction):
+        """Create the ``prompt-format`` parser and bind its handler.
+
+        Args:
+            subparsers: the sub-parsers action of the parent ``llama model``
+                parser on which this command is registered.
+        """
+        super().__init__()
+        self.parser = subparsers.add_parser(
+            "prompt-format",
+            prog="llama model prompt-format",
+            description="Show llama model message formats",
+            epilog=textwrap.dedent(
+                """
+                Example:
+                    llama model prompt-format <options>
+                """
+            ),
+            formatter_class=argparse.RawTextHelpFormatter,
+        )
+        self._add_arguments()
+        self.parser.set_defaults(func=self._run_model_template_cmd)
+
+    def _add_arguments(self):
+        """Declare the command-line options of ``prompt-format``."""
+        # NOTE(review): the value is parsed as a CoreModelId by the handler,
+        # while this default looks like a model *family* name -- confirm that
+        # the default actually resolves to a supported model.
+        self.parser.add_argument(
+            "-m",
+            "--model-name",
+            type=str,
+            default="llama3_1",
+            help="Model name (a model ID from the Llama 3.1 or Llama 3.2 families)",
+        )
+
+    def _run_model_template_cmd(self, args: argparse.Namespace) -> None:
+        """Show the prompt format of the model named by ``args.model_name``.
+
+        Args:
+            args: parsed command-line arguments; only ``model_name`` is read.
+
+        Exits through ``self.parser.error`` (usage message, exit status 2)
+        when the name is not a ``CoreModelId`` value or the model is not in
+        the Llama 3.1 / 3.2 families.
+        """
+        import pkg_resources
+
+        # Only Llama 3.1 and 3.2 are supported
+        supported_families = {ModelFamily.llama3_1, ModelFamily.llama3_2}
+        supported_model_ids = [
+            m for m in CoreModelId if model_family(m) in supported_families
+        ]
+        model_str = "\n".join(m.value for m in supported_model_ids)
+
+        try:
+            model_id = CoreModelId(args.model_name)
+        except ValueError:
+            model_id = None
+
+        if model_id not in supported_model_ids:
+            # parser.error() prints the usage plus this message and exits, so
+            # the user sees a clean CLI error instead of a traceback from an
+            # ArgumentTypeError raised outside of argparse's own parsing.
+            self.parser.error(
+                f"{args.model_name} is not a valid Model. Choose one from --\n{model_str}"
+            )
+
+        # Pick the single markdown resource that matches the model; the
+        # membership check above guarantees one of these branches applies.
+        if model_family(model_id) == ModelFamily.llama3_1:
+            resource = "llama3_1/prompt_format.md"
+        elif is_multimodal(model_id):
+            resource = "llama3_2/vision_prompt_format.md"
+        else:
+            resource = "llama3_2/text_prompt_format.md"
+
+        prompt_format_file = pkg_resources.resource_filename("llama_models", resource)
+        # Explicit encoding so the result does not depend on the locale.
+        with open(prompt_format_file, "r", encoding="utf-8") as f:
+            content = f.read()
+
+        render_markdown_to_pager(content)
+
+
+def render_markdown_to_pager(markdown_content: str):
+    """Render markdown with ``rich`` and show the result in a pager.
+
+    The markdown is rendered at a fixed width of 100 columns with terminal
+    styling forced on, then piped to ``less -R``. When ``less`` is not
+    available on ``PATH`` the rendered text is written to stdout instead of
+    failing with ``FileNotFoundError``.
+
+    Args:
+        markdown_content: the markdown source to display.
+    """
+    import shutil
+    import sys
+
+    from rich.console import Console
+    from rich.markdown import Markdown
+    from rich.style import Style
+    from rich.text import Text
+
+    class LeftAlignedHeaderMarkdown(Markdown):
+        """Markdown variant that emits headers as '#'-prefixed text."""
+
+        # NOTE(review): presumably invoked by rich for header tokens --
+        # confirm against the installed rich version.
+        def parse_header(self, token):
+            level = token.type.count("h")
+            content = Text(token.content)
+            header_style = Style(color="bright_blue", bold=True)
+            header = Text(f"{'#' * level} ", style=header_style) + content
+            self.add_text(header)
+
+    # Render the Markdown
+    md = LeftAlignedHeaderMarkdown(markdown_content)
+
+    # Capture the rendered output
+    output = StringIO()
+    console = Console(file=output, force_terminal=True, width=100)  # Set a fixed width
+    console.print(md)
+    rendered_content = output.getvalue()
+
+    # Without a pager binary, fall back to plain stdout rather than crashing.
+    if shutil.which("less") is None:
+        sys.stdout.write(rendered_content)
+        return
+
+    # Pipe to pager; -R lets less pass the ANSI styling through.
+    pager = subprocess.Popen(["less", "-R"], stdin=subprocess.PIPE)
+    pager.communicate(input=rendered_content.encode())
--- a/llama_stack/cli/model/template.py
+++ b/llama_stack/cli/model/template.py
@ -1,113 +0,0 @@
-# Copyright (c) Meta Platforms, Inc. and affiliates.
-# All rights reserved.
-#
-# This source code is licensed under the terms described in the LICENSE file in
-# the root directory of this source tree.
-
-import argparse
-import textwrap
-
-from termcolor import colored
-
-from llama_stack.cli.subcommand import Subcommand
-
-
-class ModelTemplate(Subcommand):
-    """Llama model cli for describe a model template (message formats)"""
-
-    def __init__(self, subparsers: argparse._SubParsersAction):
-        super().__init__()
-        self.parser = subparsers.add_parser(
-            "template",
-            prog="llama model template",
-            description="Show llama model message formats",
-            epilog=textwrap.dedent(
-                """
-                Example:
-                    llama model template <options>
-                """
-            ),
-            formatter_class=argparse.RawTextHelpFormatter,
-        )
-        self._add_arguments()
-        self.parser.set_defaults(func=self._run_model_template_cmd)
-
-    def _prompt_type(self, value):
-        from llama_models.llama3.api.datatypes import ToolPromptFormat
-
-        try:
-            return ToolPromptFormat(value.lower())
-        except ValueError:
-            raise argparse.ArgumentTypeError(
-                f"{value} is not a valid ToolPromptFormat. Choose from {', '.join(t.value for t in ToolPromptFormat)}"
-            ) from None
-
-    def _add_arguments(self):
-        self.parser.add_argument(
-            "-m",
-            "--model-family",
-            type=str,
-            default="llama3_1",
-            help="Model Family (llama3_1, llama3_X, etc.)",
-        )
-        self.parser.add_argument(
-            "--name",
-            type=str,
-            help="Usecase template name (system_message, user_message, assistant_message, tool_message)...",
-            required=False,
-        )
-        self.parser.add_argument(
-            "--format",
-            type=str,
-            help="ToolPromptFormat (json or function_tag). This flag is used to print the template in a specific formats.",
-            required=False,
-            default="json",
-        )
-        self.parser.add_argument(
-            "--raw",
-            action="store_true",
-            help="If set to true, don't pretty-print into a table. Useful to copy-paste.",
-        )
-
-    def _run_model_template_cmd(self, args: argparse.Namespace) -> None:
-        from llama_models.llama3.api.interface import (
-            list_jinja_templates,
-            render_jinja_template,
-        )
-
-        from llama_stack.cli.table import print_table
-
-        if args.name:
-            tool_prompt_format = self._prompt_type(args.format)
-            template, tokens_info = render_jinja_template(args.name, tool_prompt_format)
-            rendered = ""
-            for tok, is_special in tokens_info:
-                if is_special:
-                    rendered += colored(tok, "yellow", attrs=["bold"])
-                else:
-                    rendered += tok
-
-            if not args.raw:
-                rendered = rendered.replace("\n", "↵\n")
-                print_table(
-                    [
-                        (
-                            "Name",
-                            colored(template.template_name, "white", attrs=["bold"]),
-                        ),
-                        ("Template", rendered),
-                        ("Notes", template.notes),
-                    ],
-                    separate_rows=True,
-                )
-            else:
-                print("Template: ", template.template_name)
-                print("=" * 40)
-                print(rendered)
-        else:
-            templates = list_jinja_templates()
-            headers = ["Role", "Template Name"]
-            print_table(
-                [(t.role, t.template_name) for t in templates],
-                headers,
-            )