add NIM k8s solution

This commit is contained in:
Kai Wu 2025-07-29 09:01:21 -07:00
parent 95d25ddfe2
commit 8c0f328cbc
4 changed files with 133 additions and 128 deletions

View file

@@ -45,6 +45,8 @@ spec:
value: http://vllm-server.default.svc.cluster.local:8000/v1
- name: VLLM_MAX_TOKENS
value: "3072"
- name: NVIDIA_BASE_URL
value: http://llama-nano-nim.default.svc.cluster.local:8000/v1
- name: VLLM_SAFETY_URL
value: http://vllm-server-safety.default.svc.cluster.local:8001/v1
- name: POSTGRES_HOST