# Patch summary (preamble text; patch tools skip lines before the "diff --git" header).
#
# File touched: llama_stack/providers/registry/inference.py
# Hunk context reported by git: available_providers() -> List[ProviderSpec]
#
# The hunk inserts one new list element immediately before the closing "]",
# after the entry whose config_class is ...bedrock.BedrockConfig:
#
#   InlineProviderSpec
#     api          = Api.inference
#     provider_id  = "vllm"
#     pip_packages = ["vllm"]
#     module       = "llama_stack.providers.impls.vllm"
#     config_class = "llama_stack.providers.impls.vllm.VLLMConfig"
#
# NOTE(review): the module and config_class values are dotted-path strings; this
# patch does not show llama_stack.providers.impls.vllm or VLLMConfig being
# created -- confirm they exist in the same change set.
# NOTE(review): the hunk header counts (-104,4 +104,13) and the index hashes
# describe exactly the 9 added lines below; they go stale if those lines are edited.
diff --git a/llama_stack/providers/registry/inference.py b/llama_stack/providers/registry/inference.py index 6cd97fd73..107bf69b2 100644 --- a/llama_stack/providers/registry/inference.py +++ b/llama_stack/providers/registry/inference.py @@ -104,4 +104,13 @@ def available_providers() -> List[ProviderSpec]: config_class="llama_stack.providers.adapters.inference.bedrock.BedrockConfig", ), ), + InlineProviderSpec( + api=Api.inference, + provider_id="vllm", + pip_packages=[ + "vllm", + ], + module="llama_stack.providers.impls.vllm", + config_class="llama_stack.providers.impls.vllm.VLLMConfig", + ), ]