llama-stack-mirror/llama_stack/templates/remote-vllm/build.yaml

name: remote-vllm
distribution_spec:
  description: Use (an external) vLLM server for running LLM inference
  providers:
    inference: remote::vllm
    memory:
    - meta-reference
    - remote::chromadb
    - remote::pgvector
    safety: inline::llama-guard
    agents: meta-reference
    telemetry: meta-reference
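
# A minimal sketch of how a build template like this is typically turned into a
# runnable distribution, assuming the standard `llama stack` CLI (exact flags
# may differ between llama-stack versions):
#
#   llama stack build --template remote-vllm --image-type conda
#
# The generated run configuration is then expected to point the remote::vllm
# inference provider at an already-running vLLM server (e.g. via a VLLM_URL
# environment setting); the variable name here is an assumption based on the
# companion run.yaml, not defined in this file.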