fix inference

This commit is contained in:
Xi Yan 2024-09-11 14:51:06 -07:00
parent 96f3058145
commit 2d0163b47b

View file

@@ -77,7 +77,8 @@ class MetaReferenceInferenceImpl(Inference):
logprobs=logprobs, logprobs=logprobs,
) )
return self._chat_completion(request) async for chunk in self.chat_completion_impl(request):
yield chunk
async def chat_completion_impl( async def chat_completion_impl(
self, request: ChatCompletionRequest self, request: ChatCompletionRequest