update batch completion endpoint

This commit is contained in:
Ashwin Bharambe 2024-07-22 16:08:28 -07:00
parent 1e573843ce
commit 9b51b4edd8
2 changed files with 31 additions and 2 deletions

View file

@@ -108,10 +108,10 @@ class Inference(Protocol):
async def batch_completion(
self,
request: BatchCompletionRequest,
- ) -> List[CompletionResponse]: ...
+ ) -> BatchCompletionResponse: ...
@webmethod(route="/inference/batch_chat_completion")
async def batch_chat_completion(
self,
request: BatchChatCompletionRequest,
- ) -> List[ChatCompletionResponse]: ...
+ ) -> BatchChatCompletionResponse: ...