diff --git a/litellm/tests/test_caching.py b/litellm/tests/test_caching.py index a223d5923..91da1565f 100644 --- a/litellm/tests/test_caching.py +++ b/litellm/tests/test_caching.py @@ -352,98 +352,98 @@ def test_hosted_cache(): # test_hosted_cache() -def test_redis_cache_with_ttl(): - cache = Cache(type="redis", host=os.environ['REDIS_HOST'], port=os.environ['REDIS_PORT'], password=os.environ['REDIS_PASSWORD']) - sample_model_response_object_str = """{ - "choices": [ - { - "finish_reason": "stop", - "index": 0, - "message": { - "role": "assistant", - "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." - } - } - ], - "created": 1691429984.3852863, - "model": "claude-instant-1", - "usage": { - "prompt_tokens": 18, - "completion_tokens": 23, - "total_tokens": 41 - } -}""" - sample_model_response_object = { - "choices": [ - { - "finish_reason": "stop", - "index": 0, - "message": { - "role": "assistant", - "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." - } - } - ], - "created": 1691429984.3852863, - "model": "claude-instant-1", - "usage": { - "prompt_tokens": 18, - "completion_tokens": 23, - "total_tokens": 41 - } -} - cache.add_cache(cache_key="test_key", result=sample_model_response_object_str, ttl=1) - cached_value = cache.get_cache(cache_key="test_key") - print(f"cached-value: {cached_value}") - assert cached_value['choices'][0]['message']['content'] == sample_model_response_object['choices'][0]['message']['content'] - time.sleep(2) - assert cache.get_cache(cache_key="test_key") is None +# def test_redis_cache_with_ttl(): +# cache = Cache(type="redis", host=os.environ['REDIS_HOST'], port=os.environ['REDIS_PORT'], password=os.environ['REDIS_PASSWORD']) +# sample_model_response_object_str = """{ +# "choices": [ +# { +# "finish_reason": "stop", +# "index": 0, +# "message": { +# "role": "assistant", +# "content": "I'm doing well, thank you for asking. 
I am Claude, an AI assistant created by Anthropic." +# } +# } +# ], +# "created": 1691429984.3852863, +# "model": "claude-instant-1", +# "usage": { +# "prompt_tokens": 18, +# "completion_tokens": 23, +# "total_tokens": 41 +# } +# }""" +# sample_model_response_object = { +# "choices": [ +# { +# "finish_reason": "stop", +# "index": 0, +# "message": { +# "role": "assistant", +# "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." +# } +# } +# ], +# "created": 1691429984.3852863, +# "model": "claude-instant-1", +# "usage": { +# "prompt_tokens": 18, +# "completion_tokens": 23, +# "total_tokens": 41 +# } +# } +# cache.add_cache(cache_key="test_key", result=sample_model_response_object_str, ttl=1) +# cached_value = cache.get_cache(cache_key="test_key") +# print(f"cached-value: {cached_value}") +# assert cached_value['choices'][0]['message']['content'] == sample_model_response_object['choices'][0]['message']['content'] +# time.sleep(2) +# assert cache.get_cache(cache_key="test_key") is None -# test_redis_cache_with_ttl() +# # test_redis_cache_with_ttl() -def test_in_memory_cache_with_ttl(): - cache = Cache(type="local") - sample_model_response_object_str = """{ - "choices": [ - { - "finish_reason": "stop", - "index": 0, - "message": { - "role": "assistant", - "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." - } - } - ], - "created": 1691429984.3852863, - "model": "claude-instant-1", - "usage": { - "prompt_tokens": 18, - "completion_tokens": 23, - "total_tokens": 41 - } -}""" - sample_model_response_object = { - "choices": [ - { - "finish_reason": "stop", - "index": 0, - "message": { - "role": "assistant", - "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." 
- } - } - ], - "created": 1691429984.3852863, - "model": "claude-instant-1", - "usage": { - "prompt_tokens": 18, - "completion_tokens": 23, - "total_tokens": 41 - } -} - cache.add_cache(cache_key="test_key", result=sample_model_response_object_str, ttl=1) - cached_value = cache.get_cache(cache_key="test_key") - assert cached_value['choices'][0]['message']['content'] == sample_model_response_object['choices'][0]['message']['content'] - time.sleep(2) - assert cache.get_cache(cache_key="test_key") is None -# test_in_memory_cache_with_ttl() \ No newline at end of file +# def test_in_memory_cache_with_ttl(): +# cache = Cache(type="local") +# sample_model_response_object_str = """{ +# "choices": [ +# { +# "finish_reason": "stop", +# "index": 0, +# "message": { +# "role": "assistant", +# "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." +# } +# } +# ], +# "created": 1691429984.3852863, +# "model": "claude-instant-1", +# "usage": { +# "prompt_tokens": 18, +# "completion_tokens": 23, +# "total_tokens": 41 +# } +# }""" +# sample_model_response_object = { +# "choices": [ +# { +# "finish_reason": "stop", +# "index": 0, +# "message": { +# "role": "assistant", +# "content": "I'm doing well, thank you for asking. I am Claude, an AI assistant created by Anthropic." 
+# } +# } +# ], +# "created": 1691429984.3852863, +# "model": "claude-instant-1", +# "usage": { +# "prompt_tokens": 18, +# "completion_tokens": 23, +# "total_tokens": 41 +# } +# } +# cache.add_cache(cache_key="test_key", result=sample_model_response_object_str, ttl=1) +# cached_value = cache.get_cache(cache_key="test_key") +# assert cached_value['choices'][0]['message']['content'] == sample_model_response_object['choices'][0]['message']['content'] +# time.sleep(2) +# assert cache.get_cache(cache_key="test_key") is None +# # test_in_memory_cache_with_ttl() \ No newline at end of file diff --git a/litellm/tests/test_client.py b/litellm/tests/test_client.py index 709273363..123e2b3cd 100644 --- a/litellm/tests/test_client.py +++ b/litellm/tests/test_client.py @@ -1,90 +1,90 @@ -#### What this tests #### -# This tests error logging (with custom user functions) for the `completion` + `embedding` endpoints w/ callbacks -# This only tests posthog, sentry, and helicone -import sys, os -import traceback -import pytest +# #### What this tests #### +# # This tests error logging (with custom user functions) for the `completion` + `embedding` endpoints w/ callbacks +# # This only tests posthog, sentry, and helicone +# import sys, os +# import traceback +# import pytest -sys.path.insert( - 0, os.path.abspath("../..") -) # Adds the parent directory to the system path -import litellm -from litellm import embedding, completion +# sys.path.insert( +# 0, os.path.abspath("../..") +# ) # Adds the parent directory to the system path +# import litellm +# from litellm import embedding, completion -litellm.success_callback = ["posthog", "helicone"] -litellm.failure_callback = ["sentry", "posthog"] +# litellm.success_callback = ["posthog", "helicone"] +# litellm.failure_callback = ["sentry", "posthog"] -litellm.set_verbose = True +# litellm.set_verbose = True -def logger_fn(model_call_object: dict): - # print(f"model call details: {model_call_object}") - pass +# def 
logger_fn(model_call_object: dict): +# # print(f"model call details: {model_call_object}") +# pass -user_message = "Hello, how are you?" -messages = [{"content": user_message, "role": "user"}] +# user_message = "Hello, how are you?" +# messages = [{"content": user_message, "role": "user"}] -def test_completion_openai(): - try: - print("running query") - response = completion( - model="gpt-3.5-turbo", messages=messages, logger_fn=logger_fn - ) - print(f"response: {response}") - # Add any assertions here to check the response - except Exception as e: - traceback.print_exc() - pytest.fail(f"Error occurred: {e}") - - -def test_completion_claude(): - try: - response = completion( - model="claude-instant-1", messages=messages, logger_fn=logger_fn - ) - # Add any assertions here to check the response - except Exception as e: - pytest.fail(f"Error occurred: {e}") - - -def test_completion_non_openai(): - try: - response = completion( - model="claude-instant-1", messages=messages, logger_fn=logger_fn - ) - # Add any assertions here to check the response - except Exception as e: - pytest.fail(f"Error occurred: {e}") - - -def test_embedding_openai(): - try: - response = embedding( - model="text-embedding-ada-002", input=[user_message], logger_fn=logger_fn - ) - # Add any assertions here to check the response - print(f"response: {str(response)[:50]}") - except Exception as e: - pytest.fail(f"Error occurred: {e}") - - -def test_bad_azure_embedding(): - try: - response = embedding( - model="chatgpt-test", input=[user_message], logger_fn=logger_fn - ) - # Add any assertions here to check the response - print(f"response: {str(response)[:50]}") - except Exception as e: - pass - - -# def test_good_azure_embedding(): +# def test_completion_openai(): # try: -# response = embedding(model='azure/azure-embedding-model', input=[user_message], logger_fn=logger_fn) +# print("running query") +# response = completion( +# model="gpt-3.5-turbo", messages=messages, logger_fn=logger_fn +# ) +# 
print(f"response: {response}") +# # Add any assertions here to check the response +# except Exception as e: +# traceback.print_exc() +# pytest.fail(f"Error occurred: {e}") + + +# def test_completion_claude(): +# try: +# response = completion( +# model="claude-instant-1", messages=messages, logger_fn=logger_fn +# ) +# # Add any assertions here to check the response +# except Exception as e: +# pytest.fail(f"Error occurred: {e}") + + +# def test_completion_non_openai(): +# try: +# response = completion( +# model="claude-instant-1", messages=messages, logger_fn=logger_fn +# ) +# # Add any assertions here to check the response +# except Exception as e: +# pytest.fail(f"Error occurred: {e}") + + +# def test_embedding_openai(): +# try: +# response = embedding( +# model="text-embedding-ada-002", input=[user_message], logger_fn=logger_fn +# ) # # Add any assertions here to check the response # print(f"response: {str(response)[:50]}") # except Exception as e: # pytest.fail(f"Error occurred: {e}") + + +# def test_bad_azure_embedding(): +# try: +# response = embedding( +# model="chatgpt-test", input=[user_message], logger_fn=logger_fn +# ) +# # Add any assertions here to check the response +# print(f"response: {str(response)[:50]}") +# except Exception as e: +# pass + + +# # def test_good_azure_embedding(): +# # try: +# # response = embedding(model='azure/azure-embedding-model', input=[user_message], logger_fn=logger_fn) +# # # Add any assertions here to check the response +# # print(f"response: {str(response)[:50]}") +# # except Exception as e: +# # pytest.fail(f"Error occurred: {e}") diff --git a/litellm/tests/test_router.py b/litellm/tests/test_router.py index 3f3e8a24b..543c3e3ea 100644 --- a/litellm/tests/test_router.py +++ b/litellm/tests/test_router.py @@ -56,82 +56,82 @@ load_dotenv() # test_openai_only() -def test_multiple_deployments(): - import concurrent - # litellm.set_verbose=True - futures = {} - model_list = [{ # list of model deployments - "model_name": 
"gpt-3.5-turbo", # openai model name - "litellm_params": { # params for litellm completion/embedding call - "model": "azure/chatgpt-v-2", - "api_key": os.getenv("AZURE_API_KEY"), - "api_version": os.getenv("AZURE_API_VERSION"), - "api_base": os.getenv("AZURE_API_BASE") - }, - "tpm": 240000, - "rpm": 1800 - }, { - "model_name": "gpt-3.5-turbo", # openai model name - "litellm_params": { # params for litellm completion/embedding call - "model": "azure/chatgpt-functioncalling", - "api_key": os.getenv("AZURE_API_KEY"), - "api_version": os.getenv("AZURE_API_VERSION"), - "api_base": os.getenv("AZURE_API_BASE") - }, - "tpm": 240000, - "rpm": 1800 - }, { - "model_name": "gpt-3.5-turbo", # openai model name - "litellm_params": { # params for litellm completion/embedding call - "model": "gpt-3.5-turbo", - "api_key": os.getenv("OPENAI_API_KEY"), - }, - "tpm": 1000000, - "rpm": 9000 - }] +# def test_multiple_deployments(): +# import concurrent +# # litellm.set_verbose=True +# futures = {} +# model_list = [{ # list of model deployments +# "model_name": "gpt-3.5-turbo", # openai model name +# "litellm_params": { # params for litellm completion/embedding call +# "model": "azure/chatgpt-v-2", +# "api_key": os.getenv("AZURE_API_KEY"), +# "api_version": os.getenv("AZURE_API_VERSION"), +# "api_base": os.getenv("AZURE_API_BASE") +# }, +# "tpm": 240000, +# "rpm": 1800 +# }, { +# "model_name": "gpt-3.5-turbo", # openai model name +# "litellm_params": { # params for litellm completion/embedding call +# "model": "azure/chatgpt-functioncalling", +# "api_key": os.getenv("AZURE_API_KEY"), +# "api_version": os.getenv("AZURE_API_VERSION"), +# "api_base": os.getenv("AZURE_API_BASE") +# }, +# "tpm": 240000, +# "rpm": 1800 +# }, { +# "model_name": "gpt-3.5-turbo", # openai model name +# "litellm_params": { # params for litellm completion/embedding call +# "model": "gpt-3.5-turbo", +# "api_key": os.getenv("OPENAI_API_KEY"), +# }, +# "tpm": 1000000, +# "rpm": 9000 +# }] - router = 
Router(model_list=model_list, redis_host=os.getenv("REDIS_HOST"), redis_password=os.getenv("REDIS_PASSWORD"), redis_port=int(os.getenv("REDIS_PORT"))) # type: ignore +# router = Router(model_list=model_list, redis_host=os.getenv("REDIS_HOST"), redis_password=os.getenv("REDIS_PASSWORD"), redis_port=int(os.getenv("REDIS_PORT"))) # type: ignore - results = [] - with ThreadPoolExecutor(max_workers=10) as executor: - kwargs = { - "model": "gpt-3.5-turbo", - "messages": [{"role": "user", "content": """Context: +# results = [] +# with ThreadPoolExecutor(max_workers=10) as executor: +# kwargs = { +# "model": "gpt-3.5-turbo", +# "messages": [{"role": "user", "content": """Context: -In the historical era of Ancient Greece, a multitude of significant individuals lived, contributing immensely to various disciplines like science, politics, philosophy, and literature. For instance, Socrates, a renowned philosopher, primarily focused on ethics. His notable method, the Socratic Method, involved acknowledging one's own ignorance to stimulate critical thinking and illuminate ideas. His student, Plato, another prominent figure, founded the Academy in Athens. He proposed theories on justice, beauty, and equality, and also introduced the theory of forms, which is pivotal to understanding his philosophical insights. Another student of Socrates, Xenophon, distinguished himself more in the domain of history and military affairs. +# In the historical era of Ancient Greece, a multitude of significant individuals lived, contributing immensely to various disciplines like science, politics, philosophy, and literature. For instance, Socrates, a renowned philosopher, primarily focused on ethics. His notable method, the Socratic Method, involved acknowledging one's own ignorance to stimulate critical thinking and illuminate ideas. His student, Plato, another prominent figure, founded the Academy in Athens. 
He proposed theories on justice, beauty, and equality, and also introduced the theory of forms, which is pivotal to understanding his philosophical insights. Another student of Socrates, Xenophon, distinguished himself more in the domain of history and military affairs. -Aristotle, who studied under Plato, led an equally remarkable life. His extensive works have been influential across various domains, including science, logic, metaphysics, ethics, and politics. Perhaps most notably, a substantial portion of the Western intellectual tradition traces back to his writings. He later tutored Alexander the Great who went on to create one of the most vast empires in the world. +# Aristotle, who studied under Plato, led an equally remarkable life. His extensive works have been influential across various domains, including science, logic, metaphysics, ethics, and politics. Perhaps most notably, a substantial portion of the Western intellectual tradition traces back to his writings. He later tutored Alexander the Great who went on to create one of the most vast empires in the world. -In the domain of mathematics, Pythagoras and Euclid made significant contributions. Pythagoras is best known for the Pythagorean theorem, a fundamental principle in geometry, while Euclid, often regarded as the father of geometry, wrote "The Elements", a collection of definitions, axioms, theorems, and proofs. +# In the domain of mathematics, Pythagoras and Euclid made significant contributions. Pythagoras is best known for the Pythagorean theorem, a fundamental principle in geometry, while Euclid, often regarded as the father of geometry, wrote "The Elements", a collection of definitions, axioms, theorems, and proofs. -Apart from these luminaries, the period also saw a number of influential political figures. 
Pericles, a prominent and influential Greek statesman, orator, and general of Athens during the Golden Age, specifically between the Persian and Peloponnesian wars, played a significant role in developing the Athenian democracy. +# Apart from these luminaries, the period also saw a number of influential political figures. Pericles, a prominent and influential Greek statesman, orator, and general of Athens during the Golden Age, specifically between the Persian and Peloponnesian wars, played a significant role in developing the Athenian democracy. -The Ancient Greek era also witnessed extraordinary advancements in arts and literature. Homer, credited with the creation of the epic poems 'The Iliad' and 'The Odyssey,' is considered one of the greatest poets in history. The tragedies of Sophocles, Aeschylus, and Euripides left an indelible mark on the field of drama, and the comedies of Aristophanes remain influential even today. +# The Ancient Greek era also witnessed extraordinary advancements in arts and literature. Homer, credited with the creation of the epic poems 'The Iliad' and 'The Odyssey,' is considered one of the greatest poets in history. The tragedies of Sophocles, Aeschylus, and Euripides left an indelible mark on the field of drama, and the comedies of Aristophanes remain influential even today. 
---- -Question: +# --- +# Question: -Who among the mentioned figures from Ancient Greece contributed to the domain of mathematics and what are their significant contributions?"""}], - } - for _ in range(10): - future = executor.submit(router.completion, **kwargs) - futures[future] = future +# Who among the mentioned figures from Ancient Greece contributed to the domain of mathematics and what are their significant contributions?"""}], +# } +# for _ in range(10): +# future = executor.submit(router.completion, **kwargs) +# futures[future] = future - # Retrieve the results from the futures - while futures: - done, not_done = concurrent.futures.wait(futures, return_when=concurrent.futures.FIRST_COMPLETED) - for future in done: - try: - result = future.result() - print(f"result: {result}") - results.append(result) - del futures[future] - except Exception as e: - print(f"Exception: {e}; traceback: {traceback.format_exc()}") - del futures[future] # remove the done future +# # Retrieve the results from the futures +# while futures: +# done, not_done = concurrent.futures.wait(futures, return_when=concurrent.futures.FIRST_COMPLETED) +# for future in done: +# try: +# result = future.result() +# print(f"result: {result}") +# results.append(result) +# del futures[future] +# except Exception as e: +# print(f"Exception: {e}; traceback: {traceback.format_exc()}") +# del futures[future] # remove the done future - # Check results - print(results) +# # Check results +# print(results) # test_multiple_deployments() diff --git a/litellm/tests/test_streaming.py b/litellm/tests/test_streaming.py index bb899b259..4382ef0e0 100644 --- a/litellm/tests/test_streaming.py +++ b/litellm/tests/test_streaming.py @@ -518,6 +518,7 @@ def test_completion_palm_stream(): def test_completion_claude_stream_bad_key(): try: + litellm.cache = None api_key = "bad-key" messages = [ {"role": "system", "content": "You are a helpful assistant."}, @@ -538,14 +539,15 @@ def test_completion_claude_stream_bad_key(): 
	        complete_response += chunk         if complete_response.strip() == "":             raise Exception("Empty response received") -        print(f"completion_response: {complete_response}") +        print(f"completion_response: {complete_response}") +        raise Exception("Auth error not raised")     except AuthenticationError as e: -        pass +        print("Auth Error raised")     except Exception as e:         pytest.fail(f"Error occurred: {e}")  -# test_completion_claude_stream_bad_key() +test_completion_claude_stream_bad_key()  # test_completion_replicate_stream()  # def test_completion_vertexai_stream(): @@ -912,7 +914,7 @@ def test_openai_chat_completion_complete_response_call():         print(f"error occurred: {traceback.format_exc()}")         pass  -test_openai_chat_completion_complete_response_call() +# test_openai_chat_completion_complete_response_call()  def test_openai_text_completion_call():     try: