More fixes, including adding a ClusterIP Service (vllm-server) for the vLLM deployment

This commit is contained in:
Ashwin Bharambe 2025-06-01 17:07:18 -07:00
parent 6f4f51f8d9
commit 6cbb3366f2
3 changed files with 16 additions and 1 deletions

View file

@@ -57,3 +57,16 @@ spec:
- name: llama-storage
persistentVolumeClaim:
claimName: vllm-models
---
# ClusterIP Service named vllm-server; forwards TCP 8000 to the pods
# matched by the selector below.
apiVersion: v1
kind: Service
metadata:
  name: vllm-server
spec:
  # Traffic is routed to pods carrying this label.
  selector:
    app.kubernetes.io/name: vllm
  ports:
    - protocol: TCP
      port: 8000  # port exposed by the Service
      targetPort: 8000  # port on the selected pods that receives the traffic
  # ClusterIP: reachable on a cluster-internal IP only.
  type: ClusterIP