Make it work on GPUs

2025-07-02 20:40:36 +00:00 · 2025-06-24 12:20:04 -07:00 · 2025-06-24 12:20:04 -07:00 · f99ca37f91
commit f99ca37f91
parent ee96c4891b
7 changed files with 30 additions and 21 deletions
--- a/docs/source/distributions/k8s/stack-k8s.yaml.template
+++ b/docs/source/distributions/k8s/stack-k8s.yaml.template
@@ -5,6 +5,7 @@ metadata:
 spec:
  accessModes:
    - ReadWriteOnce
+  storageClassName: gp2
  resources:
    requests:
      storage: 1Gi
@@ -25,9 +26,11 @@ spec:
        app.kubernetes.io/name: llama-stack
        app.kubernetes.io/component: server
    spec:
+      nodeSelector:
+        eks.amazonaws.com/nodegroup: cpu
      containers:
      - name: llama-stack
-        image: llamastack/distribution-remote-vllm:latest
+        image: llamastack/distribution-postgres-demo:latest
        imagePullPolicy: Always # since we have specified latest instead of a version
        env:
        - name: ENABLE_CHROMADB