mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-10-14 06:23:45 +00:00
rename ModelInference to Inference
This commit is contained in:
parent
245461620d
commit
67f0510edd
18 changed files with 468 additions and 1636 deletions
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
@ -7,5 +7,5 @@ model_inference_config:
|
|||
model_parallel_size: 8
|
||||
max_seq_len: 2048
|
||||
max_batch_size: 1
|
||||
quantization:
|
||||
quantization:
|
||||
type: "fp8"
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
|
|
@ -1,4 +1,4 @@
|
|||
model_inference_config:
|
||||
inference_config:
|
||||
impl_type: "inline"
|
||||
inline_config:
|
||||
checkpoint_type: "pytorch"
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue