mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-18 19:02:30 +00:00
split off safety so it can be applied one at a time
This commit is contained in:
parent
d93f6c9e5b
commit
4121166784
5 changed files with 62 additions and 65 deletions
|
@@ -29,8 +29,12 @@ spec:
|
|||
image: llamastack/distribution-remote-vllm:latest
|
||||
imagePullPolicy: Always # since we have specified latest instead of a version
|
||||
env:
|
||||
- name: ENABLE_CHROMADB
|
||||
value: "true"
|
||||
- name: VLLM_URL
|
||||
value: http://vllm-server.default.svc.cluster.local:8000/v1
|
||||
- name: VLLM_MAX_TOKENS
|
||||
value: "3072"
|
||||
- name: VLLM_SAFETY_URL
|
||||
value: http://vllm-server-safety.default.svc.cluster.local:8001/v1
|
||||
- name: POSTGRES_HOST
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue