diff --git a/dist/litellm-0.1.487-py3-none-any.whl b/dist/litellm-0.1.487-py3-none-any.whl new file mode 100644 index 000000000..317068196 Binary files /dev/null and b/dist/litellm-0.1.487-py3-none-any.whl differ diff --git a/dist/litellm-0.1.487.tar.gz b/dist/litellm-0.1.487.tar.gz new file mode 100644 index 000000000..cf8462205 Binary files /dev/null and b/dist/litellm-0.1.487.tar.gz differ diff --git a/litellm/tests/test_streaming.py b/litellm/tests/test_streaming.py index 6cad61502..d0da5e4d7 100644 --- a/litellm/tests/test_streaming.py +++ b/litellm/tests/test_streaming.py @@ -9,7 +9,7 @@ sys.path.insert( ) # Adds the parent directory to the system path import litellm from litellm import completion -litellm.logging = False +litellm.logging = True litellm.set_verbose = True score = 0 @@ -22,25 +22,69 @@ def logger_fn(model_call_object: dict): user_message = "Hello, how are you?" messages = [{"content": user_message, "role": "user"}] -# test on anthropic completion call +# test on openai completion call try: - start_time = time.time() response = completion( - model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn + model="gpt-3.5-turbo", messages=messages, stream=True, logger_fn=logger_fn ) + response = "" for chunk in response: chunk_time = time.time() print(f"time since initial request: {chunk_time - start_time:.2f}") print(chunk["choices"][0]["delta"]) - score += 1 + response += chunk["choices"][0]["delta"] + if response == "": + raise Exception("Empty response received") except: print(f"error occurred: {traceback.format_exc()}") pass -# # test on openai completion call + +# test on azure completion call +try: + response = completion( + model="azure/chatgpt-test", messages=messages, stream=True, logger_fn=logger_fn + ) + response = "" + for chunk in response: + chunk_time = time.time() + print(f"time since initial request: {chunk_time - start_time:.2f}") + print(chunk["choices"][0]["delta"]) + response += chunk["choices"][0]["delta"] + if response == "": + raise Exception("Empty response received") +except: + print(f"error occurred: {traceback.format_exc()}") + pass + + +# test on anthropic completion call +try: + response = completion( + model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn + ) + response = "" + for chunk in response: + chunk_time = time.time() + print(f"time since initial request: {chunk_time - start_time:.2f}") + print(chunk["choices"][0]["delta"]) + response += chunk["choices"][0]["delta"] + if response == "": + raise Exception("Empty response received") +except: + print(f"error occurred: {traceback.format_exc()}") + pass + + +# # test on huggingface completion call # try: # response = completion( -# model="gpt-3.5-turbo", messages=messages, stream=True, logger_fn=logger_fn +# model="meta-llama/Llama-2-7b-chat-hf", +# messages=messages, +# custom_llm_provider="huggingface", +# custom_api_base="https://s7c7gytn18vnu4tw.us-east-1.aws.endpoints.huggingface.cloud", +# stream=True, +# logger_fn=logger_fn, # ) # for chunk in response: # print(chunk["choices"][0]["delta"]) @@ -48,47 +92,3 @@ except: # except: # print(f"error occurred: {traceback.format_exc()}") # pass - - -# # test on azure completion call -# try: -# response = completion( -# model="azure/chatgpt-test", messages=messages, stream=True, logger_fn=logger_fn -# ) -# for chunk in response: -# print(chunk["choices"][0]["delta"]) -# score += 1 -# except: -# print(f"error occurred: {traceback.format_exc()}") -# pass - - -# # test on anthropic completion call -# try: -# response = completion( -# model="claude-instant-1", messages=messages, stream=True, logger_fn=logger_fn -# ) -# for chunk in response: -# print(chunk["choices"][0]["delta"]) -# score += 1 -# except: -# print(f"error occurred: {traceback.format_exc()}") -# pass - - -# # # test on huggingface completion call -# # try: -# # response = completion( -# # model="meta-llama/Llama-2-7b-chat-hf", -# # messages=messages, -# # custom_llm_provider="huggingface", -# # custom_api_base="https://s7c7gytn18vnu4tw.us-east-1.aws.endpoints.huggingface.cloud", -# # stream=True, -# # logger_fn=logger_fn, -# # ) -# # for chunk in response: -# # print(chunk["choices"][0]["delta"]) -# # score += 1 -# # except: -# # print(f"error occurred: {traceback.format_exc()}") -# # pass diff --git a/poetry.lock b/poetry.lock index 1c438e0eb..f4de9020a 100644 --- a/poetry.lock +++ b/poetry.lock @@ -338,6 +338,25 @@ files = [ {file = "idna-3.4.tar.gz", hash = "sha256:814f528e8dead7d329833b91c5faa87d60bf71824cd12a7530b5526063d02cb4"}, ] +[[package]] +name = "importlib-metadata" +version = "6.8.0" +description = "Read metadata from Python packages" +optional = false +python-versions = ">=3.8" +files = [ + {file = "importlib_metadata-6.8.0-py3-none-any.whl", hash = "sha256:3ebb78df84a805d7698245025b975d9d67053cd94c79245ba4b3eb694abe68bb"}, + {file = "importlib_metadata-6.8.0.tar.gz", hash = "sha256:dbace7892d8c0c4ac1ad096662232f831d4e64f4c4545bd53016a3e9d4654743"}, +] + +[package.dependencies] +zipp = ">=0.5" + +[package.extras] +docs = ["furo", "jaraco.packaging (>=9)", "jaraco.tidelift (>=1.4)", "rst.linker (>=1.9)", "sphinx (>=3.5)", "sphinx-lint"] +perf = ["ipython"] +testing = ["flufl.flake8", "importlib-resources (>=1.3)", "packaging", "pyfakefs", "pytest (>=6)", "pytest-black (>=0.3.7)", "pytest-checkdocs (>=2.4)", "pytest-cov", "pytest-enabler (>=2.2)", "pytest-mypy (>=0.9.1)", "pytest-perf (>=0.9.2)", "pytest-ruff"] + [[package]] name = "multidict" version = "6.0.4" @@ -744,7 +763,22 @@ files = [ idna = ">=2.0" multidict = ">=4.0" +[[package]] +name = "zipp" +version = "3.16.2" +description = "Backport of pathlib-compatible object wrapper for zip files" +optional = false +python-versions = ">=3.8" +files = [ + {file = "zipp-3.16.2-py3-none-any.whl", hash = "sha256:679e51dd4403591b2d6838a48de3d283f3d188412a9782faadf845f298736ba0"}, + {file = "zipp-3.16.2.tar.gz", hash = "sha256:ebc15946aa78bd63458992fc81ec3b6f7b1e92d51c35e6de1c3804e73b799147"}, +] + +[package.extras] +docs = ["furo", "jaraco.packaging (>=9.3)", "jaraco.tidelift (>=1.4)", "rst.linker (>=1.9)", "sphinx (>=3.5)", "sphinx-lint"] +testing = ["big-O", "jaraco.functools", "jaraco.itertools", "more-itertools", "pytest (>=6)", "pytest-black (>=0.3.7)", "pytest-checkdocs (>=2.4)", "pytest-cov", "pytest-enabler (>=2.2)", "pytest-ignore-flaky", "pytest-mypy (>=0.9.1)", "pytest-ruff"] + [metadata] lock-version = "2.0" python-versions = "^3.8" -content-hash = "fe7d88d91250950917244f8a6ffc8eba7bfc9aa84314ed6498131172ae4ef3cf" +content-hash = "de77e77aaa3ed490ffa159387c8e70e43361d78b095a975fec950336e54758e6"