forked from phoenix/litellm-mirror

fix(main.py): don't set timeout as an optional api param

This commit is contained in:
parent aee38d9329
commit 77be3e3114

4 changed files with 9 additions and 30 deletions
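The diff removes timeout from what get_optional_params() treats as a provider API param: it is dropped from the function signature, from the default_params dict (where it defaulted to 600), from the supported_params list, and from the optional_params assignment, and completion() in main.py no longer forwards timeout=timeout into that call. Separately, CustomStreamWrapper now resolves the deployment model_id once in its constructor, with an "or {}" guard, instead of re-reading it from model_call_details for every streamed chunk.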
@@ -382,6 +382,7 @@ class OpenAIChatCompletion(BaseLLM):
                     "complete_input_dict": data,
                 },
             )

             response = await openai_aclient.chat.completions.create(**data)
             stringified_response = response.model_dump_json()
             logging_obj.post_call(

@@ -574,7 +574,6 @@ def completion(
         max_retries=max_retries,
         logprobs=logprobs,
         top_logprobs=top_logprobs,
-        timeout=timeout,
         **non_default_params,
     )

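With timeout=timeout dropped from this call, the request timeout no longer flows through get_optional_params() on its way into the provider payload. A minimal usage sketch, assuming the public litellm.completion() interface; the model name, message, and timeout value are illustrative only:

import litellm

# timeout is still accepted by completion(), but it is handled as a
# client/request-level setting rather than being forwarded to the provider
# as if it were a model parameter.
response = litellm.completion(
    model="gpt-3.5-turbo",
    messages=[{"role": "user", "content": "Hello"}],
    timeout=30,  # seconds; illustrative value
)
print(response.choices[0].message.content)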
@@ -195,7 +195,7 @@ def test_get_cloudflare_response_streaming():
     asyncio.run(test_async_call())


-test_get_cloudflare_response_streaming()
+# test_get_cloudflare_response_streaming()


 def test_get_response_streaming():

@@ -2910,7 +2910,6 @@ def get_optional_params(
     max_retries=None,
     logprobs=None,
     top_logprobs=None,
-    timeout=None,
     **kwargs,
 ):
     # retrieve all parameters passed to the function

@@ -2940,7 +2939,6 @@ def get_optional_params(
         "max_retries": None,
         "logprobs": None,
         "top_logprobs": None,
-        "timeout": 600,
     }
     # filter out those parameters that were passed with non-default values
     non_default_params = {

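The removed "timeout": 600 entry matters because of the filtering step named in the comment above: a parameter survives the filter only when its passed value differs from its default_params entry, so any timeout other than 600 used to be collected along with the provider-bound params. A self-contained sketch of that pattern, not litellm's exact code, with made-up values:

# Sketch of the "filter out non-default values" step referenced above.
default_params = {"temperature": None, "max_retries": None, "timeout": 600}
passed_params = {"temperature": 0.2, "max_retries": None, "timeout": 30}

non_default_params = {
    k: v
    for k, v in passed_params.items()
    if k in default_params and v != default_params[k]
}
print(non_default_params)  # {'temperature': 0.2, 'timeout': 30}

# After this commit, completion() no longer passes timeout into
# get_optional_params() at all, and the "timeout": 600 default that made a
# custom timeout look like a non-default API param is gone.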
@@ -3734,7 +3732,6 @@ def get_optional_params(
             "max_retries",
             "logprobs",
             "top_logprobs",
-            "timeout",
         ]
         _check_valid_arg(supported_params=supported_params)
         if functions is not None:

@@ -3775,8 +3772,6 @@ def get_optional_params(
             optional_params["logprobs"] = logprobs
         if top_logprobs is not None:
             optional_params["top_logprobs"] = top_logprobs
-        if timeout is not None:
-            optional_params["timeout"] = timeout
     # if user passed in non-default kwargs for specific providers/models, pass them along
     for k in passed_params.keys():
         if k not in default_params.keys():

@@ -6539,12 +6534,14 @@ class CustomStreamWrapper:
         self.special_tokens = ["<|assistant|>", "<|system|>", "<|user|>", "<s>", "</s>"]
         self.holding_chunk = ""
         self.complete_response = ""
-        self._hidden_params = {
-            "model_id": (
-                self.logging_obj.model_call_details.get("litellm_params", {})
-                .get("model_info", {})
-                .get("id", None)
+        _model_info = (
+            self.logging_obj.model_call_details.get("litellm_params", {}).get(
+                "model_info", {}
             )
+            or {}
+        )
+        self._hidden_params = {
+            "model_id": (_model_info.get("id", None))
         } # returned as x-litellm-model-id response header in proxy

     def __iter__(self):

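The rewritten constructor reads model_info once into _model_info and adds an "or {}" fallback. The old chained lookup only covered a missing model_info key: dict.get falls back to {} when the key is absent, but returns None unchanged when the key is present with a None value, and the follow-up .get("id", None) then raises. A small standalone sketch of the difference, using a made-up litellm_params dict:

litellm_params = {"model_info": None}  # key present, value explicitly None

# Old pattern: raises AttributeError: 'NoneType' object has no attribute 'get'
try:
    model_id = litellm_params.get("model_info", {}).get("id", None)
except AttributeError as err:
    print("old pattern failed:", err)

# New pattern: "or {}" also covers an explicit None (or any other falsy value)
_model_info = litellm_params.get("model_info", {}) or {}
model_id = _model_info.get("id", None)
print("new pattern:", model_id)  # None, and no exception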
@@ -7437,14 +7434,6 @@ class CustomStreamWrapper:
                     target=self.logging_obj.success_handler, args=(response,)
                 ).start() # log response
                 # RETURN RESULT
-                if hasattr(response, "_hidden_params"):
-                    response._hidden_params["model_id"] = (
-                        self.logging_obj.model_call_details.get(
-                            "litellm_params", {}
-                        )
-                        .get("model_info", {})
-                        .get("id", None)
-                    )
                 return response
             except StopIteration:
                 raise # Re-raise StopIteration

@@ -7495,16 +7484,6 @@ class CustomStreamWrapper:
                             processed_chunk,
                         )
                     )
-                    # RETURN RESULT
-                    if hasattr(processed_chunk, "_hidden_params"):
-                        model_id = (
-                            self.logging_obj.model_call_details.get(
-                                "litellm_params", {}
-                            )
-                            .get("model_info", {})
-                            .get("id", None)
-                        )
-                        processed_chunk._hidden_params["model_id"] = model_id
                 return processed_chunk
             raise StopAsyncIteration
         else: # temporary patch for non-aiohttp async calls

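Both streaming paths previously re-derived model_id from model_call_details for every returned chunk; those blocks are removed, and with the constructor change above the wrapper resolves the id once into self._hidden_params (returned as the x-litellm-model-id response header in the proxy, per the comment in __init__). A rough sketch of that shape, assuming a simplified wrapper class that is not litellm's actual implementation:

class StreamWrapperSketch:
    """Illustrative only: compute model_id once instead of per chunk."""

    def __init__(self, model_call_details: dict):
        _model_info = (
            model_call_details.get("litellm_params", {}).get("model_info", {}) or {}
        )
        # Resolved once here; the per-chunk __next__/__anext__ paths no longer
        # need to repeat the lookup.
        self._hidden_params = {"model_id": _model_info.get("id", None)}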