From c4bda13820ee6c25ca9a02ad596e495b41f9981e Mon Sep 17 00:00:00 2001
From: ishaan-jaff
Date: Tue, 5 Dec 2023 15:32:15 -0800
Subject: [PATCH] (fix) sagemaker Llama-2 70b

---
 litellm/utils.py | 4 +++-
 1 file changed, 3 insertions(+), 1 deletion(-)

diff --git a/litellm/utils.py b/litellm/utils.py
index e8e2b57b3..f419ebcd3 100644
--- a/litellm/utils.py
+++ b/litellm/utils.py
@@ -2206,7 +2206,9 @@ def get_optional_params(  # use the openai defaults
         if max_tokens is not None:
             optional_params["max_output_tokens"] = max_tokens
     elif custom_llm_provider == "sagemaker":
-        if "llama-2" in model:
+        if "llama-2" in model.lower() or (
+            "llama" in model.lower() and "2" in model.lower()  # some combination of llama and "2" should exist
+        ):  # jumpstart can also send "Llama-2-70b-chat-hf-48xlarge"
             # llama-2 models on sagemaker support the following args
             """
             max_new_tokens: Model generates text until the output length (excluding the input context length) reaches max_new_tokens. If specified, it must be a positive integer.
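
Notes: the old check `"llama-2" in model` was case-sensitive and only matched the exact hyphenated substring, so a JumpStart endpoint name like "Llama-2-70b-chat-hf-48xlarge" never hit the Llama-2 parameter mapping. The patch lowercases the name and also accepts any name containing both "llama" and "2". Below is a minimal standalone sketch of that condition for reference; `is_sagemaker_llama2` is a hypothetical helper name used only for illustration, as litellm performs this check inline inside `get_optional_params`:

```python
def is_sagemaker_llama2(model: str) -> bool:
    """Return True if a SageMaker model name looks like a Llama-2 deployment.

    Hypothetical helper mirroring the condition added by this patch; not
    part of the litellm API.
    """
    name = model.lower()
    # Exact "llama-2" substring, or any combination of "llama" and "2" --
    # JumpStart can send names like "Llama-2-70b-chat-hf-48xlarge".
    return "llama-2" in name or ("llama" in name and "2" in name)


if __name__ == "__main__":
    for m in [
        "meta-textgeneration-llama-2-7b",   # matches via "llama-2"
        "Llama-2-70b-chat-hf-48xlarge",     # matches after lowercasing
        "falcon-40b",                       # no match
    ]:
        print(m, "->", is_sagemaker_llama2(m))
```

Note the trade-off in the second clause: it keeps JumpStart's varied naming from silently skipping the Llama-2 arg mapping, at the cost of also matching any future model name that happens to contain both "llama" and a "2" anywhere in the string.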