mirror of
https://github.com/BerriAI/litellm.git
synced 2025-04-27 11:43:54 +00:00
(test) Router: Test Azure acompletion, stream
This commit is contained in:
parent
58ab0a3f03
commit
e579918dd9
1 changed files with 83 additions and 0 deletions
|
@ -139,6 +139,89 @@ def test_reading_key_from_model_list():
|
||||||
# test_reading_key_from_model_list()
|
# test_reading_key_from_model_list()
|
||||||
|
|
||||||
|
|
||||||
|
|
||||||
|
def test_router_azure_acompletion():
    """
    [PROD TEST CASE] Exercise the Router against Azure: one async completion
    call and one async completion + stream call, verifying each gets a
    response (this is ~90% of the router use case).

    DO NOT REMOVE THIS TEST. It's an IMP ONE. Speak to Ishaan, if you are
    trying to remove this.
    """
    litellm.set_verbose = False
    # Remove the api key from the env to reproduce how the proxy passes the
    # key to the router. Read it BEFORE the try block: the original restored
    # it inside `except`, which raised NameError (masking the real failure)
    # whenever the exception happened before `old_api_key` was bound.
    old_api_key = os.environ.pop("AZURE_API_KEY")
    try:
        print("Router Test Azure - Acompletion, Acompletion with stream")

        model_list = [
            {
                "model_name": "gpt-3.5-turbo",  # openai model name
                "litellm_params": {  # params for litellm completion/embedding call
                    "model": "azure/chatgpt-v-2",
                    "api_key": old_api_key,
                    "api_version": os.getenv("AZURE_API_VERSION"),
                    "api_base": os.getenv("AZURE_API_BASE"),
                },
                "tpm": 240000,
                "rpm": 1800,
            },
            {
                # Second identical deployment so "simple-shuffle" routing has
                # more than one candidate to pick from.
                "model_name": "gpt-3.5-turbo",  # openai model name
                "litellm_params": {  # params for litellm completion/embedding call
                    "model": "azure/chatgpt-v-2",
                    "api_key": old_api_key,
                    "api_version": os.getenv("AZURE_API_VERSION"),
                    "api_base": os.getenv("AZURE_API_BASE"),
                },
                "tpm": 240000,
                "rpm": 1800,
            },
        ]

        router = Router(
            model_list=model_list,
            routing_strategy="simple-shuffle",
            set_verbose=True,
        )  # type: ignore

        async def test1():
            # Plain async completion — verify a response comes back.
            response = await router.acompletion(
                model="gpt-3.5-turbo",
                messages=[
                    {
                        "role": "user",
                        "content": "hello this request will fail",
                    }
                ],
            )
            print("\n response", response)

        asyncio.run(test1())

        print("\n Testing streaming response")

        async def test2():
            # Streaming async completion — drain the stream to verify chunks arrive.
            response = await router.acompletion(
                model="gpt-3.5-turbo",
                messages=[
                    {
                        "role": "user",
                        "content": "hello this request will fail",
                    }
                ],
                stream=True,
            )
            async for chunk in response:
                if chunk is not None:
                    print(chunk)

        asyncio.run(test2())
        print("\n Passed Streaming")
        router.reset()
    except Exception as e:
        print("FAILED TEST")
        pytest.fail(f"Got unexpected exception on router! - {e}")
    finally:
        # Always restore the env var, even on non-Exception exits
        # (e.g. KeyboardInterrupt), so later tests see the key.
        os.environ["AZURE_API_KEY"] = old_api_key
test_router_azure_acompletion()
|
||||||
|
|
||||||
### FUNCTION CALLING
|
### FUNCTION CALLING
|
||||||
|
|
||||||
def test_function_calling():
|
def test_function_calling():
|
||||||
|
|
Loading…
Add table
Add a link
Reference in a new issue