Mirror of https://github.com/meta-llama/llama-stack.git
fix: Make remote::vllm compatible with vLLM <= v0.6.3
Signed-off-by: Yuan Tang <terrytangyuan@gmail.com>
This commit is contained in:
parent
7f9b767277
commit
d6204b072f
1 changed file with 6 additions and 0 deletions
@@ -270,6 +270,12 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         tool_config: Optional[ToolConfig] = None,
     ) -> AsyncGenerator:
         model = await self.model_store.get_model(model_id)
+        # This is to be consistent with OpenAI API and support vLLM <= v0.6.3
+        # References:
+        #   * https://platform.openai.com/docs/api-reference/chat/create#chat-create-tool_choice
+        #   * https://github.com/vllm-project/vllm/pull/10000
+        if (tools is None or len(tools) == 0) and tool_config is not None:
+            tool_config.tool_choice = ToolChoice.none
         request = ChatCompletionRequest(
             model=model.provider_resource_id,
             messages=messages,
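For context, a minimal usage sketch (not part of the commit) of the request shape this guard keeps valid for older servers. It uses the standard OpenAI Python client against a vLLM OpenAI-compatible endpoint; the base URL, API key, and model name are placeholders. Per the OpenAI spec cited in the added comment, tool_choice defaults to none when no tools are supplied, and vLLM <= v0.6.3 appears not to accept a non-none tool_choice without tools, so the adapter downgrades tool_choice to none before building the ChatCompletionRequest.

# Hypothetical sketch, not from the commit: calling a vLLM
# OpenAI-compatible server with no tools. Base URL, API key, and
# model name are placeholders.
from openai import OpenAI

client = OpenAI(base_url="http://localhost:8000/v1", api_key="not-needed")

# No tools are supplied, so tool_choice is left unset; the OpenAI spec
# treats "none" as the default in this case, which is the state the
# adapter's new guard enforces on the server-bound request.
response = client.chat.completions.create(
    model="meta-llama/Llama-3.1-8B-Instruct",
    messages=[{"role": "user", "content": "Hello!"}],
)
print(response.choices[0].message.content)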