#### What this tests ####
# This tests streaming for the completion endpoint
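
# completion() with stream=True yields response chunks; the test below reads the
# incremental text from chunk["choices"][0]["delta"] (OpenAI-style streaming format).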

import sys, os
import traceback
import time

sys.path.insert(
    0, os.path.abspath("../..")
)  # Adds the parent directory to the system path
import litellm
from litellm import completion

litellm.set_verbose = True

score = 0


def logger_fn(model_call_object: dict):
    print(f"model call details: {model_call_object}")


user_message = "Hello, how are you?"
messages = [{"content": user_message, "role": "user"}]

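# Note: the live call below makes a real request, so the relevant provider key
# (e.g. ANTHROPIC_API_KEY) is assumed to be set in the environment.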
# test on anthropic completion call
try:
    start_time = time.time()
    response = completion(
        model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn
    )
    for chunk in response:
        chunk_time = time.time()
        print(f"time since initial request: {chunk_time - start_time:.2f}")
        print(chunk["choices"][0]["delta"])
    score += 1
except Exception:  # keep the test from crashing; just report the traceback
    print(f"error occurred: {traceback.format_exc()}")
    pass
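
# Illustrative sketch (not part of the original test): assuming each delta is an
# OpenAI-style dict with an optional "content" key, the streamed pieces could be
# joined back into the full completion text like this:
#
# complete_response = ""
# for part in completion(
#     model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn
# ):
#     complete_response += part["choices"][0]["delta"].get("content", "") or ""
# print(f"complete streamed response: {complete_response}")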

# # test on openai completion call
# try:
#     response = completion(
#         model="gpt-3.5-turbo", messages=messages, stream=True, logger_fn=logger_fn
#     )
#     for chunk in response:
#         print(chunk["choices"][0]["delta"])
#     score += 1
# except:
#     print(f"error occurred: {traceback.format_exc()}")
#     pass

# # test on azure completion call
# try:
#     response = completion(
#         model="azure/chatgpt-test", messages=messages, stream=True, logger_fn=logger_fn
#     )
#     for chunk in response:
#         print(chunk["choices"][0]["delta"])
#     score += 1
# except:
#     print(f"error occurred: {traceback.format_exc()}")
#     pass

# # test on anthropic completion call
# try:
#     response = completion(
#         model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn
#     )
#     for chunk in response:
#         print(chunk["choices"][0]["delta"])
#     score += 1
# except:
#     print(f"error occurred: {traceback.format_exc()}")
#     pass

# # # test on huggingface completion call
# # try:
# #     response = completion(
# #         model="meta-llama/Llama-2-7b-chat-hf",
# #         messages=messages,
# #         custom_llm_provider="huggingface",
# #         custom_api_base="https://s7c7gytn18vnu4tw.us-east-1.aws.endpoints.huggingface.cloud",
# #         stream=True,
# #         logger_fn=logger_fn,
# #     )
# #     for chunk in response:
# #         print(chunk["choices"][0]["delta"])
# #     score += 1
# # except:
# #     print(f"error occurred: {traceback.format_exc()}")
# #     pass