(fix) add lint check banning direct creation of AsyncHTTPHandler during LLM calls (#6855)

* fix triton
* fix TEXT_COMPLETION_CODESTRAL
* fix REPLICATE
* fix CLARIFAI
* fix HUGGINGFACE
* add test_no_async_http_handler_usage
* fix PREDIBASE
* fix anthropic use get_async_httpx_client
* fix vertex fine tuning
* fix dbricks get_async_httpx_client
* fix get_async_httpx_client vertex
* fix get_async_httpx_client
* fix get_async_httpx_client
* fix make_async_azure_httpx_request
* fix check_for_async_http_handler
* test: cleanup mistral model
* add check for AsyncClient
* fix check_for_async_http_handler
* fix get_async_httpx_client
* fix tests using in_memory_llm_clients_cache
* fix langfuse import
* fix import

---------

Co-authored-by: Krrish Dholakia <krrishdholakia@gmail.com>
2025-04-26 19:24:27 +00:00 · 2024-11-21 19:03:02 -08:00 · 2024-11-21 19:03:02 -08:00 · aa6b133557
commit aa6b133557
parent 7c595e770c
26 changed files with 288 additions and 62 deletions
--- a/litellm/llms/text_completion_codestral.py
+++ b/litellm/llms/text_completion_codestral.py
@@ -18,7 +18,10 @@ import litellm
 from litellm import verbose_logger
 from litellm.litellm_core_utils.core_helpers import map_finish_reason
 from litellm.litellm_core_utils.litellm_logging import Logging as LiteLLMLogging
-from litellm.llms.custom_httpx.http_handler import AsyncHTTPHandler
+from litellm.llms.custom_httpx.http_handler import (
+    AsyncHTTPHandler,
+    get_async_httpx_client,
+)
 from litellm.types.llms.databricks import GenericStreamingChunk
 from litellm.utils import (
    Choices,
@@ -479,8 +482,9 @@ class CodestralTextCompletion(BaseLLM):
        headers={},
    ) -> TextCompletionResponse:

-        async_handler = AsyncHTTPHandler(
-            timeout=httpx.Timeout(timeout=timeout), concurrent_limit=1
+        async_handler = get_async_httpx_client(
+            llm_provider=litellm.LlmProviders.TEXT_COMPLETION_CODESTRAL,
+            params={"timeout": timeout},
        )
        try: