mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-06-28 19:04:19 +00:00
add /inference/chat_completion to SSE special case
This commit is contained in:
parent
4f021de10f
commit
2b63074676
3 changed files with 31 additions and 28 deletions
|
@@ -35,7 +35,10 @@ from llama_toolchain.stack import LlamaStack
|
|||
|
||||
|
||||
# TODO: this should be fixed in the generator itself so it reads appropriate annotations
|
||||
STREAMING_ENDPOINTS = ["/agentic_system/turn/create"]
|
||||
STREAMING_ENDPOINTS = [
|
||||
"/agentic_system/turn/create",
|
||||
"/inference/chat_completion",
|
||||
]
|
||||
|
||||
|
||||
def patch_sse_stream_responses(spec: Specification):
|
||||
|
|
Loading…
Add table
Add a link
Reference in a new issue