more progress on auto-generation

This commit is contained in:
Ashwin Bharambe 2024-11-15 09:35:38 -08:00
parent cfa913fdd5
commit e4509cb568
10 changed files with 309 additions and 73 deletions

View file

@@ -35,7 +35,7 @@ class VLLMConfig(BaseModel):
)
@classmethod
-def sample_dict(cls):
+def sample_run_config(cls):
return {
"model": "${env.VLLM_INFERENCE_MODEL:Llama3.2-3B-Instruct}",
"tensor_parallel_size": "${env.VLLM_TENSOR_PARALLEL_SIZE:1}",