# What does this PR do?

Extract API definitions and provider specifications into a standalone llama-stack-api package that can be published to PyPI independently of the main llama-stack server.

See: https://github.com/llamastack/llama-stack/pull/2978 and https://github.com/llamastack/llama-stack/pull/2978#issuecomment-3145115942

## Motivation

External providers currently import from llama-stack, which overrides the installed version and causes dependency conflicts. This separation allows external providers to:

- Install only the type definitions they need, without server dependencies
- Avoid version conflicts with the installed llama-stack package
- Be versioned and released independently

This lets us re-enable the external provider module tests that were previously blocked by these import conflicts.

## Changes

- Created the llama-stack-api package with minimal dependencies (pydantic, jsonschema)
- Moved the APIs, provider datatypes, strong_typing, and schema_utils
- Updated all imports from llama_stack.* to llama_stack_api.* (see the sketch below)
- Configured a local editable install for the development workflow
- Updated the linting and type-checking configuration for both packages

## Next Steps

- Publish llama-stack-api to PyPI
- Update external provider dependencies
- Re-enable external provider module tests

Precursor PRs to this one:

- #4093
- #3954
- #4064

These PRs moved key pieces _out_ of the API package, limiting the scope of change here.

Relates to #3237

## Test Plan

The package builds successfully and can be imported independently. All pre-commit hooks pass, with the expected exclusions maintained.

---------

Signed-off-by: Charlie Doern <cdoern@redhat.com>
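To illustrate the import migration called out above, here is a minimal sketch. The commented-out `llama_stack.*` paths are hypothetical examples of the old pattern, while the `llama_stack_api` import matches the script below:

```python
# Before: types were imported from the server package, so an external
# provider had to install (and match versions with) all of llama-stack.
# These paths are illustrative of the old llama_stack.* layout:
#
#   from llama_stack.apis.common.errors import ModelNotFoundError
#   from llama_stack.providers.datatypes import ProviderSpec

# After: the same definition comes from the standalone package, which
# only depends on pydantic and jsonschema.
from llama_stack_api import ModelNotFoundError
```

Because the new package carries no server dependencies, external providers can pin llama-stack-api without conflicting with whatever llama-stack version is installed alongside them.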
#!/usr/bin/env python
# Copyright (c) Meta Platforms, Inc. and affiliates.
# All rights reserved.
#
# This source code is licensed under the terms described in the LICENSE file in
# the root directory of this source tree.

# Run this script:
# torchrun --nproc_per_node=8 scripts/generate_prompt_format.py meta-llama/Llama-4-17B-Omni-Instruct-BF16-16E ~/.llama/checkpoints/Llama-4-17B-Omni-Instruct-BF16-16E/ llama_stack.models.llama.llama4.prompts llama_stack/models/llama/llama4/prompt_format.md

import importlib
import os
from pathlib import Path

import fire
from llama_stack_api import ModelNotFoundError

from llama_stack.models.llama.llama3.generation import Llama3
from llama_stack.models.llama.llama4.generation import Llama4
from llama_stack.models.llama.sku_list import resolve_model

THIS_DIR = Path(__file__).parent.resolve()


def run_main(
    model_id: str,
    checkpoint_dir: str,
    module_name: str,
    output_path: str,
    llama4: bool = True,
):
    # The prompts module must expose a usecases() callable; see the sketch
    # after this file for the shape of the values it returns.
    module = importlib.import_module(module_name)
    assert hasattr(module, "usecases"), f"Module {module_name} missing usecases function"

    llama_model = resolve_model(model_id)
    if not llama_model:
        raise ModelNotFoundError(model_id)

    cls = Llama4 if llama4 else Llama3
    generator = cls.build(
        ckpt_dir=checkpoint_dir,
        max_seq_len=4096,
        max_batch_size=1,
    )

    # Plain strings pass through verbatim; other use cases render themselves
    # against the loaded generator.
    use_cases = module.usecases()
    text = ""
    for u in use_cases:
        if isinstance(u, str):
            use_case_text = f"\n{u}\n"
        else:
            use_case_text = u.to_text(generator)

        text += use_case_text
        print(use_case_text)

    # dirname() is "" when output_path is a bare filename; fall back to "."
    # so makedirs does not fail on it.
    os.makedirs(os.path.dirname(output_path) or ".", exist_ok=True)
    with open(output_path, "w") as f:
        f.write(text)


def main():
    fire.Fire(run_main)


if __name__ == "__main__":
    main()
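The script assumes only that the module passed as module_name exposes a usecases() callable returning a mix of plain strings and objects with a to_text(generator) method. A minimal hypothetical module satisfying that contract (the EchoUseCase class here is invented for illustration; the real use-case types live under llama_stack.models.llama.*.prompts):

```python
# my_prompts.py -- illustrative only, not the real prompts module.


class EchoUseCase:
    """Toy use case: formats a canned prompt as a markdown section."""

    def __init__(self, title: str, prompt: str):
        self.title = title
        self.prompt = prompt

    def to_text(self, generator) -> str:
        # The real use cases call into `generator` to produce example
        # completions; this toy version ignores it and emits static text.
        return f"\n## {self.title}\n\n{self.prompt}\n"


def usecases():
    # Strings are written to the output file verbatim; other entries are
    # rendered via to_text(generator).
    return [
        "# Prompt Format",
        EchoUseCase("Basic chat", "Describe the chat message format."),
    ]
```

Pointing the script at such a module (in place of llama_stack.models.llama.llama4.prompts in the torchrun command above) would render those sections to the given output path, assuming the model ID and checkpoint resolve.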