diff --git a/llama_stack/providers/inline/inference/vllm/vllm.py b/llama_stack/providers/inline/inference/vllm/vllm.py
index 1caae9687..2672c3dbb 100644
--- a/llama_stack/providers/inline/inference/vllm/vllm.py
+++ b/llama_stack/providers/inline/inference/vllm/vllm.py
@@ -78,7 +78,7 @@ class VLLMInferenceImpl(Inference, ModelsProtocolPrivate):
         self.engine = AsyncLLMEngine.from_engine_args(engine_args)
 
     async def shutdown(self):
-        """Shutdown the vLLM inference adapter."""
+        """Shut down the vLLM inference adapter."""
         log.info("Shutting down vLLM inference provider.")
         if self.engine:
             self.engine.shutdown_background_loop()