forked from phoenix/litellm-mirror
update to expose longer_context_model_fallback_dict
This commit is contained in:
parent
10dc3f735e
commit
e9747fb763
5 changed files with 43 additions and 4 deletions
|
@ -1,10 +1,36 @@
|
||||||
# Reliability
|
# Reliability
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
## Helper utils
|
||||||
LiteLLM supports the following functions for reliability:
|
LiteLLM supports the following functions for reliability:
|
||||||
|
* `litellm.longer_context_model_fallback_dict`: Dictionary which has a mapping for those models which have larger equivalents
|
||||||
* `completion_with_retries`: use tenacity retries
|
* `completion_with_retries`: use tenacity retries
|
||||||
* `completion()` with fallback models: set `fallback_models=['gpt-3.5-turbo', 'command-nightly', 'llama2']`. If primary model fails try fallback models
|
* `completion()` with fallback models: set `fallback_models=['gpt-3.5-turbo', 'command-nightly', 'llama2']`. If primary model fails try fallback models
|
||||||
|
|
||||||
## Completion with Retries
|
## Context Window Errors
|
||||||
|
|
||||||
|
```python
|
||||||
|
from litellm import completion, longer_context_model_fallback_dict, ContextWindowExceededError
|
||||||
|
|
||||||
|
sample_text = "how does a court case get to the Supreme Court?" * 1000
|
||||||
|
messages = [{"content": sample_text, "role": "user"}]
|
||||||
|
model = "gpt-3.5-turbo"
|
||||||
|
try:
|
||||||
|
# try the original model
|
||||||
|
response = completion(model=model, messages=messages)
|
||||||
|
# catch the context window error
|
||||||
|
except ContextWindowExceededError as e:
|
||||||
|
if model in longer_context_model_fallback_dict:
|
||||||
|
# switch to the equivalent larger model -> gpt-3.5-turbo-16k
|
||||||
|
new_model = longer_context_model_fallback_dict[model]
|
||||||
|
response = completion(new_model, messages)
|
||||||
|
|
||||||
|
print(response)
|
||||||
|
```
|
||||||
|
|
||||||
|
|
||||||
|
## Retry failed requests
|
||||||
|
|
||||||
You can use this as a drop-in replacement for the `completion()` function to use tenacity retries - by default we retry the call 3 times.
|
You can use this as a drop-in replacement for the `completion()` function to use tenacity retries - by default we retry the call 3 times.
|
||||||
|
|
||||||
|
@ -29,7 +55,7 @@ def test_completion_custom_provider_model_name():
|
||||||
print(f"Error occurred: {e}")
|
print(f"Error occurred: {e}")
|
||||||
```
|
```
|
||||||
|
|
||||||
## Completion with Fallbacks
|
## Specify fallback models
|
||||||
LLM APIs can be unstable, completion() with fallbacks ensures you'll always get a response from your calls
|
LLM APIs can be unstable, completion() with fallbacks ensures you'll always get a response from your calls
|
||||||
|
|
||||||
## Usage
|
## Usage
|
||||||
|
|
|
@ -261,7 +261,7 @@ models_by_provider: dict = {
|
||||||
}
|
}
|
||||||
|
|
||||||
# mapping for those models which have larger equivalents
|
# mapping for those models which have larger equivalents
|
||||||
longer_context_model_fallback_dict = {
|
longer_context_model_fallback_dict: dict = {
|
||||||
# openai chat completion models
|
# openai chat completion models
|
||||||
"gpt-3.5-turbo": "gpt-3.5-turbo-16k",
|
"gpt-3.5-turbo": "gpt-3.5-turbo-16k",
|
||||||
"gpt-3.5-turbo-0301": "gpt-3.5-turbo-16k-0301",
|
"gpt-3.5-turbo-0301": "gpt-3.5-turbo-16k-0301",
|
||||||
|
|
Binary file not shown.
13
litellm/tests/test_longer_context_fallback.py
Normal file
13
litellm/tests/test_longer_context_fallback.py
Normal file
|
@ -0,0 +1,13 @@
|
||||||
|
#### What this tests ####
|
||||||
|
# This tests context fallback dict
|
||||||
|
|
||||||
|
import sys, os
|
||||||
|
import traceback
|
||||||
|
import pytest
|
||||||
|
sys.path.insert(
|
||||||
|
0, os.path.abspath("../..")
|
||||||
|
) # Adds the parent directory to the system path
|
||||||
|
import litellm
|
||||||
|
from litellm import longer_context_model_fallback_dict
|
||||||
|
|
||||||
|
print(longer_context_model_fallback_dict)
|
|
@ -1,6 +1,6 @@
|
||||||
[tool.poetry]
|
[tool.poetry]
|
||||||
name = "litellm"
|
name = "litellm"
|
||||||
version = "0.1.749"
|
version = "0.1.750"
|
||||||
description = "Library to easily interface with LLM API providers"
|
description = "Library to easily interface with LLM API providers"
|
||||||
authors = ["BerriAI"]
|
authors = ["BerriAI"]
|
||||||
license = "MIT License"
|
license = "MIT License"
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue