diff --git a/src/llama_stack/core/server/server.py b/src/llama_stack/core/server/server.py index 0d3513980..4c391d7f1 100644 --- a/src/llama_stack/core/server/server.py +++ b/src/llama_stack/core/server/server.py @@ -205,7 +205,11 @@ async def sse_generator(event_gen_coroutine): except asyncio.CancelledError: logger.info("Generator cancelled") if event_gen: - await event_gen.aclose() + # Some generators (like OpenAI's AsyncStream) only have close() + if hasattr(event_gen, "aclose"): + await event_gen.aclose() + elif hasattr(event_gen, "close"): + await event_gen.close() except Exception as e: logger.exception("Error in sse_generator") yield create_sse_event(