forked from phoenix/litellm-mirror

adding tenacity retries

commit a8b3fc6c2d (parent 10832be1e4)
12 changed files with 37 additions and 11 deletions
litellm/__init__.py

@@ -3,6 +3,7 @@ failure_callback = []
 set_verbose=False
 telemetry=True
 max_tokens = 256 # OpenAI Defaults
+retry = True # control tenacity retries.
 ####### PROXY PARAMS ################### configurable params if you use proxy models like Helicone
 api_base = None
 headers = None
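The new flag is a plain module-level toggle. A short usage sketch, based on the decorator comment in main.py below ("turn this off by setting `litellm.retry = False`"):

import litellm

litellm.retry = False  # opt out of tenacity retries on completion() calls
litellm.retry = True   # default: retry transient failures with backoff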
BIN litellm/__pycache__/__init__.cpython-311.pyc (new file, binary file not shown)
BIN litellm/__pycache__/main.cpython-311.pyc (new file, binary file not shown)
BIN litellm/__pycache__/timeout.cpython-311.pyc (new file, binary file not shown)
BIN litellm/__pycache__/utils.cpython-311.pyc (new file, binary file not shown)
BIN litellm/integrations/__pycache__/__init__.cpython-311.pyc (new file, binary file not shown)
litellm/main.py

@@ -7,6 +7,11 @@ import traceback
 import litellm
 from litellm import client, logging, exception_type, timeout, success_callback, failure_callback
 import random
+from tenacity import (
+    retry,
+    stop_after_attempt,
+    wait_random_exponential,
+)  # for exponential backoff
 ####### ENVIRONMENT VARIABLES ###################
 dotenv.load_dotenv() # Loading env variables using dotenv
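A self-contained sketch of what these tenacity primitives do, using the same wait and stop settings as the decorator below (flaky() and its attempt counter are illustrative, not part of litellm):

from tenacity import retry, stop_after_attempt, wait_random_exponential

calls = {"count": 0}

@retry(wait=wait_random_exponential(min=1, max=60), stop=stop_after_attempt(2), reraise=True)
def flaky():
    calls["count"] += 1
    if calls["count"] < 2:
        raise ConnectionError("transient failure")
    return "ok"

print(flaky())  # attempt 1 raises, tenacity sleeps a random 1-60s backoff, attempt 2 returns "ok"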
@@ -55,6 +60,7 @@ def get_optional_params(
 ####### COMPLETION ENDPOINTS ################
 #############################################
 @client
+@retry(wait=wait_random_exponential(min=1, max=60), stop=stop_after_attempt(2), reraise=True, retry_error_callback=lambda retry_state: setattr(retry_state.outcome, 'retry_variable', litellm.retry)) # retry call, turn this off by setting `litellm.retry = False`
 @timeout(60) ## set timeouts, in case calls hang (e.g. Azure) - default is 60s, override with `force_timeout`
 def completion(
     model, messages, # required params
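One subtlety in the decorator above: when stop_after_attempt is exhausted, tenacity invokes a configured retry_error_callback and returns the callback's return value, which takes precedence over reraise=True. A standalone sketch of that behavior (the fallback string is illustrative):

from tenacity import retry, stop_after_attempt, wait_fixed

@retry(
    wait=wait_fixed(0.1),
    stop=stop_after_attempt(2),
    reraise=True,
    retry_error_callback=lambda retry_state: "fallback-after-retries",
)
def always_fails():
    raise RuntimeError("boom")

print(always_fails())  # prints "fallback-after-retries"; the callback result wins over reraise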
litellm/tests/test_logging.py

@@ -15,13 +15,14 @@ def logger_fn(model_call_object: dict):
 user_message = "Hello, how are you?"
 messages = [{ "content": user_message,"role": "user"}]

 print(os.environ)
 temp_key = os.environ.get("OPENAI_API_KEY")
 os.environ["OPENAI_API_KEY"] = "bad-key"
 # test on openai completion call
 try:
     response = completion(model="gpt-3.5-turbo", messages=messages, logger_fn=logger_fn, api_key=temp_key)
     print(f"response: {response}")
 except:
     print(f"error occurred: {traceback.format_exc()}")
     pass

 os.environ["OPENAI_API_KEY"] = temp_key
litellm/tests/test_bad_params.py

@@ -4,7 +4,8 @@

 import sys, os
+import traceback

 from dotenv import load_dotenv
 load_dotenv()
 # Get the current directory of the script
 current_dir = os.path.dirname(os.path.abspath(__file__))

@@ -19,7 +20,7 @@ import litellm
 from litellm import embedding, completion

 litellm.set_verbose = True
 litellm.success_callback = ["posthog"]
 litellm.failure_callback = ["slack", "sentry", "posthog"]

@@ -36,3 +37,16 @@ def test_completion_with_empty_model():
 except Exception as e:
     print(f"error occurred: {e}")
     pass
+
+
+#bad key
+temp_key = os.environ.get("OPENAI_API_KEY")
+os.environ["OPENAI_API_KEY"] = "bad-key"
+# test on openai completion call
+try:
+    response = completion(model="gpt-3.5-turbo", messages=messages)
+    print(f"response: {response}")
+except:
+    print(f"error occurred: {traceback.format_exc()}")
+    pass
+os.environ["OPENAI_API_KEY"] = temp_key
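Both test files use the same pattern: stash the real key, point OPENAI_API_KEY at a bad value, exercise the failure path, then restore the key. A sketch of the same idea with pytest's monkeypatch fixture (an assumption, these tests don't currently use it), which restores the variable automatically even if the test body raises:

from litellm import completion

def test_completion_bad_key(monkeypatch):
    monkeypatch.setenv("OPENAI_API_KEY", "bad-key")
    messages = [{"content": "Hello, how are you?", "role": "user"}]
    try:
        completion(model="gpt-3.5-turbo", messages=messages)
    except Exception as e:
        print(f"error occurred: {e}")
    # monkeypatch undoes setenv on teardown; no manual restore needed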
litellm/tests/test_timeout.py

@@ -18,7 +18,8 @@ start_time = time.time()

 try:
     stop_after_10_s(force_timeout=1)
-except:
+except Exception as e:
+    print(e)
     pass

 end_time = time.time()
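For context, a sketch of what the function under test presumably looks like (an assumption from its name; the real definition lives earlier in the test file): a function wrapped by litellm's timeout decorator, where the per-call force_timeout=1 overrides the decorator's default.

import time
from litellm import timeout

@timeout(10)  # default limit; callers pass force_timeout= to override it
def stop_after_10_s(**kwargs):  # must accept **kwargs so force_timeout passes through
    time.sleep(10)  # always exceeds a force_timeout of 1 second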
litellm/timeout.py

@@ -37,26 +37,29 @@ def timeout(
         thread = _LoopWrapper()
         thread.start()
         future = asyncio.run_coroutine_threadsafe(async_func(), thread.loop)
-        try:
+        local_timeout_duration = timeout_duration
+        if "force_timeout" in kwargs:
+            local_timeout_duration = kwargs["force_timeout"]
+        try:
             result = future.result(timeout=local_timeout_duration)
         except futures.TimeoutError:
             thread.stop_loop()
-            raise exception_to_raise()
+            raise exception_to_raise(f"A timeout error occurred. The function call took longer than {local_timeout_duration} second(s).")
         thread.stop_loop()
         return result

     @wraps(func)
     async def async_wrapper(*args, **kwargs):
         local_timeout_duration = timeout_duration
         if "force_timeout" in kwargs:
             local_timeout_duration = kwargs["force_timeout"]
         try:
             value = await asyncio.wait_for(
                 func(*args, **kwargs), timeout=timeout_duration
             )
             return value
         except asyncio.TimeoutError:
-            raise exception_to_raise()
+            raise exception_to_raise(f"A timeout error occurred. The function call took longer than {local_timeout_duration} second(s).")

     if iscoroutinefunction(func):
         return async_wrapper
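The sync path now recomputes its limit from a per-call force_timeout kwarg before waiting on the future; note that the async path still hands the original timeout_duration to asyncio.wait_for, so force_timeout only takes effect for synchronous functions here. A self-contained sketch of the same override pattern (illustrative names, using a thread pool in place of litellm's event-loop wrapper):

import concurrent.futures as futures
import functools
import time

def timeout(timeout_duration=60, exception_to_raise=TimeoutError):
    def decorator(func):
        @functools.wraps(func)
        def wrapper(*args, **kwargs):
            # Per-call override: force_timeout beats the decorator default.
            limit = kwargs.pop("force_timeout", timeout_duration)
            pool = futures.ThreadPoolExecutor(max_workers=1)
            try:
                return pool.submit(func, *args, **kwargs).result(timeout=limit)
            except futures.TimeoutError:
                raise exception_to_raise(
                    f"A timeout error occurred. The function call took longer than {limit} second(s)."
                )
            finally:
                pool.shutdown(wait=False)  # the worker thread itself cannot be interrupted
        return wrapper
    return decorator

@timeout(timeout_duration=60)
def slow_call():
    time.sleep(5)

slow_call(force_timeout=1)  # raises after ~1s despite the 60s default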
setup.py

@@ -2,7 +2,7 @@ from setuptools import setup, find_packages

 setup(
     name='litellm',
-    version='0.1.226',
+    version='0.1.227',
     description='Library to easily interface with LLM API providers',
     author='BerriAI',
     packages=[