llama-stack/llama_stack/templates/remote-vllm/build.yaml
2024-11-12 12:54:44 -08:00

12 lines
332 B
YAML

# Build template for the `remote-vllm` distribution.
name: remote-vllm
distribution_spec:
  description: Use (an external) vLLM server for running LLM inference
  # Provider selection, keyed by API name. A scalar names a single provider;
  # a sequence lists several providers for the same API.
  # NOTE(review): the `inline::` / `remote::` prefixes presumably distinguish
  # in-process providers from adapters to external services — confirm
  # against the provider registry.
  providers:
    inference: remote::vllm
    memory:
      - inline::faiss
      - remote::chromadb
      - remote::pgvector
    safety: inline::llama-guard
    agents: inline::meta-reference
    telemetry: inline::meta-reference