mirror of
https://github.com/meta-llama/llama-stack.git
synced 2025-07-29 15:23:51 +00:00
fix inference
This commit is contained in:
parent
96f3058145
commit
2d0163b47b
1 changed files with 2 additions and 1 deletions
|
@ -77,7 +77,8 @@ class MetaReferenceInferenceImpl(Inference):
|
||||||
logprobs=logprobs,
|
logprobs=logprobs,
|
||||||
)
|
)
|
||||||
|
|
||||||
return self._chat_completion(request)
|
async for chunk in self.chat_completion_impl(request):
|
||||||
|
yield chunk
|
||||||
|
|
||||||
async def chat_completion_impl(
|
async def chat_completion_impl(
|
||||||
self, request: ChatCompletionRequest
|
self, request: ChatCompletionRequest
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue