mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-08-02 08:44:44 +00:00
add NIM k8s solution
This commit is contained in:
parent
95d25ddfe2
commit
8c0f328cbc
4 changed files with 133 additions and 128 deletions
|
@ -45,6 +45,8 @@ spec:
|
|||
value: http://vllm-server.default.svc.cluster.local:8000/v1
|
||||
- name: VLLM_MAX_TOKENS
|
||||
value: "3072"
|
||||
- name: NVIDIA_BASE_URL
|
||||
value: http://llama-nano-nim.default.svc.cluster.local:8000/v1
|
||||
- name: VLLM_SAFETY_URL
|
||||
value: http://vllm-server-safety.default.svc.cluster.local:8001/v1
|
||||
- name: POSTGRES_HOST
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue