Add vLLM inference provider for OpenAI compatible vLLM server (#178)
This PR adds a vLLM inference provider for OpenAI-compatible vLLM servers.
parent 59c43736e8
commit a27a2cd2af
6 changed files with 209 additions and 1 deletion
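What makes a remote provider possible is that vLLM's server speaks the OpenAI chat-completions protocol, so the stack only has to issue standard OpenAI-style HTTP requests against the server's /v1 routes. A minimal sketch of such a request, assuming a locally running server (the base URL, model id, and prompt below are placeholders, not values from this commit):

# Sketch: talk to a vLLM server through its OpenAI-compatible API.
# Assumes the server was started along the lines of:
#   python -m vllm.entrypoints.openai.api_server --model <model-id>
from openai import OpenAI

client = OpenAI(
    base_url="http://localhost:8000/v1",  # vLLM's OpenAI-compatible endpoint
    api_key="EMPTY",                      # vLLM ignores the key by default
)

response = client.chat.completions.create(
    model="meta-llama/Llama-2-7b-chat-hf",  # placeholder model id
    messages=[{"role": "user", "content": "Hello!"}],
)
print(response.choices[0].message.content)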
@@ -7,4 +7,4 @@ distribution_spec:
     safety: meta-reference
     agents: meta-reference
     telemetry: meta-reference
-image_type: conda
+image_type: conda
llama_stack/distribution/templates/remote-vllm-build.yaml (new file, +10 lines)
@@ -0,0 +1,10 @@
+name: remote-vllm
+distribution_spec:
+  description: Use remote vLLM for running LLM inference
+  providers:
+    inference: remote::vllm
+    memory: meta-reference
+    safety: meta-reference
+    agents: meta-reference
+    telemetry: meta-reference
+image_type: docker
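The template only selects remote::vllm as the inference provider; the address of an already-running vLLM server still has to be supplied when the distribution is configured. A hypothetical sketch of what the remote call boils down to (the class name, constructor argument, and URL are illustrative assumptions, not code from this PR):

# Hypothetical client showing the shape of a remote::vllm call:
# forward a chat request to a running vLLM server over its
# OpenAI-compatible REST route.
import requests

class RemoteVLLMClient:
    def __init__(self, url: str):
        self.url = url.rstrip("/")  # e.g. "http://vllm-host:8000"

    def chat(self, model: str, messages: list[dict]) -> str:
        # vLLM serves the standard /v1/chat/completions route.
        resp = requests.post(
            f"{self.url}/v1/chat/completions",
            json={"model": model, "messages": messages},
            timeout=60,
        )
        resp.raise_for_status()
        return resp.json()["choices"][0]["message"]["content"]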