Add a meta-reference-quantized-gpu distribution

This commit is contained in:
Ashwin Bharambe 2024-10-23 19:33:14 -07:00
parent f5dcc03742
commit 05a8d47b98
6 changed files with 104 additions and 4 deletions

View file

@@ -36,7 +36,7 @@ def available_providers() -> List[ProviderSpec]:
pip_packages=(
META_REFERENCE_DEPS
+ [
"fbgemm-gpu==0.8.0",
"fbgemm-gpu",
]
),
module="llama_stack.providers.impls.meta_reference.inference",