version: '2'
distribution_spec:
  description: Use a built-in vLLM engine for running LLM inference
  providers:
    inference:
    - inline::vllm
    - inline::sentence-transformers
    vector_io:
    - inline::faiss
    - remote::chromadb
    - remote::pgvector
    safety:
    - inline::llama-guard
    agents:
    - inline::meta-reference
    telemetry:
    - inline::meta-reference
    datasetio:
    - remote::huggingface
    - inline::localfs
    tool_runtime:
    - remote::brave-search
    - remote::tavily-search
    - inline::code-interpreter
    - inline::rag-runtime
    - remote::model-context-protocol
image_type: conda
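
# Notes (assumptions, not part of the spec itself):
# Provider IDs follow llama-stack's `<type>::<name>` convention, where
# `inline::` providers run inside the stack process and `remote::`
# providers call out to an external service (e.g. a ChromaDB server).
#
# A config like this is typically consumed by the llama-stack build CLI,
# along the lines of (verify flags against your installed version):
#
#   llama stack build --config ./build.yaml
#
# With `image_type: conda`, the build produces a conda environment; the
# resulting stack is then started with `llama stack run` and the generated
# run configuration.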