Pod -> Deployment, NodePort -> ClusterIP

Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
This commit is contained in:
Yuan Tang 2025-01-29 21:32:22 -05:00
parent abad607bf8
commit ddba43fada
No known key found for this signature in database

View file

@@ -32,13 +32,20 @@ type: Opaque
data: data:
token: "<YOUR-HF-TOKEN>" token: "<YOUR-HF-TOKEN>"
--- ---
apiVersion: v1 apiVersion: apps/v1
kind: Pod kind: Deployment
metadata: metadata:
name: vllm-server name: vllm-server
labels:
app: vllm
spec: spec:
replicas: 1
selector:
matchLabels:
app.kubernetes.io/name: vllm
template:
metadata:
labels:
app.kubernetes.io/name: vllm
spec:
containers: containers:
- name: llama-stack - name: llama-stack
image: <VLLM-IMAGE> image: <VLLM-IMAGE>
@@ -73,11 +80,12 @@ metadata:
name: vllm-server name: vllm-server
spec: spec:
selector: selector:
app: vllm app.kubernetes.io/name: vllm
ports: ports:
- port: 8000 - protocol: TCP
port: 8000
targetPort: 8000 targetPort: 8000
type: NodePort type: ClusterIP
EOF EOF
``` ```
@@ -135,13 +143,20 @@ spec:
requests: requests:
storage: 1Gi storage: 1Gi
--- ---
apiVersion: v1 apiVersion: apps/v1
kind: Pod kind: Deployment
metadata: metadata:
name: llama-stack-pod name: llama-stack-server
labels:
app: llama-stack
spec: spec:
replicas: 1
selector:
matchLabels:
app.kubernetes.io/name: llama-stack
template:
metadata:
labels:
app.kubernetes.io/name: llama-stack
spec:
containers: containers:
- name: llama-stack - name: llama-stack
image: localhost/llama-stack-run-k8s:latest image: localhost/llama-stack-run-k8s:latest
@@ -163,7 +178,7 @@ metadata:
name: llama-stack-service name: llama-stack-service
spec: spec:
selector: selector:
app: llama-stack app.kubernetes.io/name: llama-stack
ports: ports:
- protocol: TCP - protocol: TCP
port: 5000 port: 5000