mirror of
https://github.com/meta-llama/llama-stack.git
synced 2026-01-03 04:42:16 +00:00
template update
This commit is contained in:
parent
f1faa9c924
commit
ac3a65d261
37 changed files with 14 additions and 39 deletions
|
|
@ -1,5 +1,4 @@
|
|||
version: '2'
|
||||
name: meta-reference-quantized-gpu
|
||||
distribution_spec:
|
||||
description: Use Meta Reference with fp8, int4 quantization for running LLM inference
|
||||
providers:
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue