Merge branch 'main' into add-watsonx-inference-adapter

2025-12-29 10:02:20 +00:00 · 2025-04-06 16:28:39 +05:30 · 2025-04-06 16:28:39 +05:30 · 8cf8bd35f8
commit 8cf8bd35f8
parent 7eb83264ef 3f92b2bf85
141 changed files with 206076 additions and 6917 deletions
--- a/llama_stack/providers/registry/inference.py
+++ b/llama_stack/providers/registry/inference.py
@@ -39,13 +39,7 @@ def available_providers() -> List[ProviderSpec]:
        InlineProviderSpec(
            api=Api.inference,
            provider_type="inline::meta-reference-quantized",
-            pip_packages=(
-                META_REFERENCE_DEPS
-                + [
-                    "fbgemm-gpu",
-                    "torchao==0.5.0",
-                ]
-            ),
+            pip_packages=META_REFERENCE_DEPS + ["fbgemm-gpu", "torchao==0.5.0"],
            module="llama_stack.providers.inline.inference.meta_reference",
            config_class="llama_stack.providers.inline.inference.meta_reference.MetaReferenceQuantizedInferenceConfig",
        ),