mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-27 18:50:41 +00:00
New quantized models (#301)
This commit is contained in:
parent
05a8d47b98
commit
7afe51c84d
6 changed files with 292 additions and 21 deletions
|
@ -37,6 +37,7 @@ def available_providers() -> List[ProviderSpec]:
|
|||
META_REFERENCE_DEPS
|
||||
+ [
|
||||
"fbgemm-gpu",
|
||||
"torchao==0.5.0",
|
||||
]
|
||||
),
|
||||
module="llama_stack.providers.impls.meta_reference.inference",
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue