Correct a traceback in vllm

File "/usr/local/lib/python3.10/site-packages/llama_stack/providers/adapters/inference/vllm/vllm.py", line 136, in _stream_chat_completion
async for chunk in process_chat_completion_stream_response(
TypeError: process_chat_completion_stream_response() takes 2 positional arguments but 3 were given

This corrects the error by removing the request argument from the call.
Steve Grubb 2024-11-04 17:11:10 -05:00
parent ac93dd89cf
commit b6e2526f60


@@ -134,7 +134,7 @@ class VLLMInferenceAdapter(Inference, ModelsProtocolPrivate):
         stream = _to_async_generator()
         async for chunk in process_chat_completion_stream_response(
-            request, stream, self.formatter
+            stream, self.formatter
         ):
             yield chunk
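
For context, the traceback shows that process_chat_completion_stream_response accepts only two positional arguments (the chunk stream and the formatter). Below is a minimal, self-contained sketch of the corrected call pattern; the helper bodies and formatter value are illustrative stand-ins, not the actual llama_stack implementations.

import asyncio


async def process_chat_completion_stream_response(stream, formatter):
    # Stub standing in for the llama_stack helper: it takes exactly two
    # positional arguments and yields processed chat-completion events.
    async for chunk in stream:
        yield f"processed({formatter}): {chunk}"


async def _to_async_generator():
    # Stand-in for the adapter's stream of raw vLLM chunks.
    for chunk in ("hello", " world"):
        yield chunk


async def _stream_chat_completion(formatter="formatter"):
    stream = _to_async_generator()
    # Passing (request, stream, formatter) here triggered the original
    # TypeError; the corrected call passes only (stream, formatter).
    async for chunk in process_chat_completion_stream_response(stream, formatter):
        print(chunk)


if __name__ == "__main__":
    asyncio.run(_stream_chat_completion())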