Merge branch 'meta-llama:main' into preprocessors

This commit is contained in:
Ilya Kolchinsky 2025-04-07 12:03:11 +02:00 committed by GitHub
commit 3941d083ea
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
71 changed files with 206623 additions and 6480 deletions

View file

@@ -39,13 +39,7 @@ def available_providers() -> List[ProviderSpec]:
InlineProviderSpec(
api=Api.inference,
provider_type="inline::meta-reference-quantized",
pip_packages=(
META_REFERENCE_DEPS
+ [
"fbgemm-gpu",
"torchao==0.5.0",
]
),
pip_packages=META_REFERENCE_DEPS + ["fbgemm-gpu", "torchao==0.5.0"],
module="llama_stack.providers.inline.inference.meta_reference",
config_class="llama_stack.providers.inline.inference.meta_reference.MetaReferenceQuantizedInferenceConfig",
),