mirror of
https://github.com/meta-llama/llama-stack.git
synced 2026-01-04 18:42:18 +00:00
Fix issue when generating vLLM distros
Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
This commit is contained in:
parent
89e3f81520
commit
7c726826b8
3 changed files with 14 additions and 46 deletions
|
|
@@ -134,7 +134,7 @@ def get_distribution_template() -> DistributionTemplate:
|
|||
"Inference model loaded into the vLLM server",
|
||||
),
|
||||
"VLLM_URL": (
|
||||
- "http://host.docker.internal:5100}/v1",
|
||||
+ "http://host.docker.internal:5100/v1",
|
||||
"URL of the vLLM server with the main inference model",
|
||||
),
|
||||
"MAX_TOKENS": (
|
||||
|
|
|
|||
Loading…
Add table
Add a link
Reference in a new issue