rename ModelInference to Inference

This commit is contained in:
rsm 2024-07-21 12:19:52 -07:00
parent 245461620d
commit 67f0510edd
18 changed files with 468 additions and 1636 deletions

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"
@ -7,5 +7,5 @@ model_inference_config:
model_parallel_size: 8
max_seq_len: 2048
max_batch_size: 1
quantization:
quantization:
type: "fp8"

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"

View file

@ -1,4 +1,4 @@
model_inference_config:
inference_config:
impl_type: "inline"
inline_config:
checkpoint_type: "pytorch"