# Mirror of https://github.com/meta-llama/llama-stack.git
# (synced 2025-12-31 02:53:52 +00:00; 91 lines, 3.1 KiB, YAML)
{{/*
Deployment for the llama-stack server.

Values read by this template:
  replicaCount, podAnnotations, podLabels, imagePullSecrets,
  podSecurityContext, securityContext, image.{repository,tag,pullPolicy},
  service.port, vllm.{url,apiKey,inferenceModel},
  telemetry.{enabled,sinks,serviceName}, env,
  livenessProbe, readinessProbe, startupProbe, resources,
  nodeSelector, affinity, tolerations.

The container is started with "--yaml-config /config/run.yaml"; that path is
backed by the ConfigMap "<fullname>-run-config" mounted at /config.
*/}}
apiVersion: apps/v1
kind: Deployment
metadata:
  name: {{ include "llama-stack.fullname" . }}
  labels:
    {{- include "llama-stack.labels" . | nindent 4 }}
spec:
  replicas: {{ .Values.replicaCount }}
  selector:
    matchLabels:
      {{- include "llama-stack.selectorLabels" . | nindent 6 }}
  template:
    metadata:
      {{- with .Values.podAnnotations }}
      annotations:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      labels:
        {{- include "llama-stack.labels" . | nindent 8 }}
        {{- with .Values.podLabels }}
        {{- toYaml . | nindent 8 }}
        {{- end }}
    spec:
      {{- with .Values.imagePullSecrets }}
      imagePullSecrets:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      serviceAccountName: {{ include "llama-stack.serviceAccountName" . }}
      securityContext:
        {{- toYaml .Values.podSecurityContext | nindent 8 }}
      containers:
        - name: {{ .Chart.Name }}
          securityContext:
            {{- toYaml .Values.securityContext | nindent 12 }}
          {{- /* image.repository is passed through tpl, so it may itself contain template expressions. */}}
          image: "{{ (tpl .Values.image.repository $) }}:{{ .Values.image.tag | default .Chart.AppVersion }}"
          imagePullPolicy: {{ .Values.image.pullPolicy }}
          ports:
            - name: http
              containerPort: {{ .Values.service.port }}
              protocol: TCP
          args:
            - "--yaml-config"
            - "/config/run.yaml"
          env:
            {{- /* The vLLM variables are emitted only when .Values.vllm is set. */}}
            {{- /* NOTE(review): apiKey is rendered as a plain-text env value; consider a Secret with secretKeyRef - confirm with chart owners. */}}
            {{- with .Values.vllm }}
            - name: VLLM_URL
              value: {{ .url | quote }}
            - name: VLLM_API_TOKEN
              value: {{ .apiKey | default "" | quote }}
            - name: INFERENCE_MODEL
              value: {{ .inferenceModel | quote }}
            {{- end }}
            - name: LLAMA_STACK_PORT
              value: {{ .Values.service.port | quote }}
            {{- if .Values.telemetry.enabled }}
            - name: TELEMETRY_SINKS
              value: {{ .Values.telemetry.sinks | quote }}
            - name: OTEL_SERVICE_NAME
              value: {{ .Values.telemetry.serviceName | quote }}
            {{- end }}
            {{- /* Extra user-supplied env entries are appended verbatim. */}}
            {{- with .Values.env }}
            {{- toYaml . | nindent 12 }}
            {{- end }}
          {{- /* Each probe is rendered only when configured, so an unset or empty value does not produce a null or handler-less probe. Probe values go through tpl with the root context. */}}
          {{- with .Values.livenessProbe }}
          livenessProbe:
            {{- tpl (toYaml .) $ | nindent 12 }}
          {{- end }}
          {{- with .Values.readinessProbe }}
          readinessProbe:
            {{- tpl (toYaml .) $ | nindent 12 }}
          {{- end }}
          {{- with .Values.startupProbe }}
          startupProbe:
            {{- tpl (toYaml .) $ | nindent 12 }}
          {{- end }}
          resources:
            {{- toYaml .Values.resources | nindent 12 }}
          volumeMounts:
            - name: config-volume
              mountPath: /config
      volumes:
        - name: config-volume
          configMap:
            name: {{ include "llama-stack.fullname" . }}-run-config
            {{- /* NOTE(review): 0755 marks the mounted config files executable; 0644 is probably sufficient - confirm before changing. */}}
            defaultMode: 0755
      {{- with .Values.nodeSelector }}
      nodeSelector:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      {{- with .Values.affinity }}
      affinity:
        {{- toYaml . | nindent 8 }}
      {{- end }}
      {{- with .Values.tolerations }}
      tolerations:
        {{- toYaml . | nindent 8 }}
      {{- end }}