New quantized models (#301)

This commit is contained in:
Ashwin Bharambe 2024-10-24 08:38:56 -07:00 committed by GitHub
parent 05a8d47b98
commit 7afe51c84d
No known key found for this signature in database
GPG key ID: B5690EEEBB952194
6 changed files with 292 additions and 21 deletions

View file

@@ -37,6 +37,7 @@ def available_providers() -> List[ProviderSpec]:
META_REFERENCE_DEPS
+ [
"fbgemm-gpu",
"torchao==0.5.0",
]
),
module="llama_stack.providers.impls.meta_reference.inference",