Merge pull request #3751 from BerriAI/litellm_router_abatch_completion_one_model

[FEAT] - add litellm.Router - `abatch_completion_one_model_multiple_requests`
Ishaan Jaff 2024-05-20 18:42:54 -07:00 committed by GitHub
commit e8a3916d46

@@ -662,6 +662,10 @@ class Router:
    async def abatch_completion(
        self, models: List[str], messages: List[Dict[str, str]], **kwargs
    ):
        """
        Async Batch Completion - Batch Process 1 request to multiple model_groups on litellm.Router
        Use this for sending the same request to N models
        """

        async def _async_completion_no_exceptions(
            model: str, messages: List[Dict[str, str]], **kwargs
        ):
@@ -686,6 +690,51 @@ class Router:
        response = await asyncio.gather(*_tasks)
        return response
    async def abatch_completion_one_model_multiple_requests(
        self, model: str, messages: List[List[Dict[str, str]]], **kwargs
    ):
        """
        Async Batch Completion - Batch Process multiple Messages to one model_group on litellm.Router

        Use this for sending multiple requests to 1 model

        Args:
            model (str): model group
            messages (List[List[Dict[str, str]]]): list of messages. Each element in the list is one request
            **kwargs: additional kwargs

        Usage:
            response = await self.abatch_completion_one_model_multiple_requests(
                model="gpt-3.5-turbo",
                messages=[
                    [{"role": "user", "content": "hello"}, {"role": "user", "content": "tell me something funny"}],
                    [{"role": "user", "content": "hello good morning"}],
                ]
            )
        """

        async def _async_completion_no_exceptions(
            model: str, messages: List[Dict[str, str]], **kwargs
        ):
            """
            Wrapper around self.acompletion that catches exceptions and returns them as a result
            """
            try:
                return await self.acompletion(model=model, messages=messages, **kwargs)
            except Exception as e:
                return e

        _tasks = []
        for message_request in messages:
            # schedule each request; failures are captured and returned as exceptions instead of raising
            _tasks.append(
                _async_completion_no_exceptions(
                    model=model, messages=message_request, **kwargs
                )
            )

        response = await asyncio.gather(*_tasks)
        return response
    def image_generation(self, prompt: str, model: str, **kwargs):
        try:
            kwargs["model"] = model