fix(utils.py): more logging

Krrish Dholakia 2023-12-12 12:52:48 -08:00
parent 632d6e0bff
commit 1e970841a4
4 changed files with 49 additions and 2 deletions

BIN dist/litellm-1.12.6.dev3.tar.gz vendored (binary file not shown)

@@ -1084,7 +1084,52 @@ def test_completion_chat_sagemaker():
         assert len(complete_response) > 0
     except Exception as e:
         pytest.fail(f"Error occurred: {e}")
-test_completion_chat_sagemaker()
+# test_completion_chat_sagemaker()
+def test_completion_chat_sagemaker():
+    try:
+        messages = [{"role": "user", "content": "Hey, how's it going?"}]
+        litellm.set_verbose=True
+        response = completion(
+            model="sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4",
+            messages=messages,
+            max_tokens=100,
+            temperature=0.7,
+            stream=True,
+        )
+        # Add any assertions here to check the response
+        complete_response = ""
+        for chunk in response:
+            complete_response += chunk.choices[0].delta.content or ""
+        print(f"complete_response: {complete_response}")
+        assert len(complete_response) > 0
+    except Exception as e:
+        pytest.fail(f"Error occurred: {e}")
+import asyncio
+@pytest.mark.asyncio
+async def test_completion_chat_sagemaker():
+    try:
+        messages = [{"role": "user", "content": "Hey, how's it going?"}]
+        litellm.set_verbose=True
+        response = await litellm.acompletion(
+            model="sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4",
+            messages=messages,
+            max_tokens=100,
+            temperature=0.7,
+            stream=True,
+        )
+        # Add any assertions here to check the response
+        complete_response = ""
+        async for chunk in response:
+            complete_response += chunk.choices[0].delta.content or ""
+        print(f"complete_response: {complete_response}")
+        assert len(complete_response) > 0
+    except:
+        pass
+asyncio.run(test_completion_chat_sagemaker())
 def test_completion_chat_sagemaker_mistral():
     try:
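For reference, the streaming call exercised by the new tests can be run outside pytest with a few lines. The sketch below is not part of the commit: it reuses the SageMaker endpoint name from the tests and assumes AWS credentials are configured; substitute any model you can call.

# Stand-alone sketch (not part of this diff): stream a completion the same way
# the new async test does. Assumes AWS credentials and access to the SageMaker
# endpoint named in the tests above.
import asyncio
import litellm

litellm.set_verbose = True  # surfaces the print_verbose output touched in utils.py

async def stream_once() -> str:
    response = await litellm.acompletion(
        model="sagemaker/berri-benchmarking-Llama-2-70b-chat-hf-4",
        messages=[{"role": "user", "content": "Hey, how's it going?"}],
        max_tokens=100,
        temperature=0.7,
        stream=True,
    )
    text = ""
    async for chunk in response:
        # Each chunk is an OpenAI-style delta; content can be None on the final chunk.
        text += chunk.choices[0].delta.content or ""
    return text

if __name__ == "__main__":
    print(asyncio.run(stream_once()))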


@@ -5692,6 +5692,7 @@ class CustomStreamWrapper:
                 if chunk is not None and chunk != b'':
                     print_verbose(f"PROCESSED CHUNK PRE CHUNK CREATOR: {chunk}")
                     response = self.chunk_creator(chunk=chunk)
+                    print_verbose(f"PROCESSED CHUNK POST CHUNK CREATOR: {chunk}")
                     if response is None:
                         continue
                     ## LOGGING
@@ -5700,6 +5701,7 @@ class CustomStreamWrapper:
         except StopIteration:
             raise # Re-raise StopIteration
         except Exception as e:
+            print_verbose(f"HITS AN ERROR: {str(e)}")
             traceback_exception = traceback.format_exc()
             # LOG FAILURE - handle streaming failure logging in the _next_ object, remove `handle_failure` once it's deprecated
             threading.Thread(target=self.logging_obj.failure_handler, args=(e, traceback_exception)).start()
@@ -5731,8 +5733,8 @@ class CustomStreamWrapper:
                 # example - boto3 bedrock llms
                 print_verbose(f"ENTERS __NEXT__ LOOP")
                 processed_chunk = next(self)
-                asyncio.create_task(self.logging_obj.async_success_handler(processed_chunk,))
                 print_verbose(f"PROCESSED CHUNK IN __ANEXT__: {processed_chunk}")
+                asyncio.create_task(self.logging_obj.async_success_handler(processed_chunk,))
                 return processed_chunk
         except StopAsyncIteration:
             raise
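The added print_verbose calls follow litellm's verbosity-gated logging pattern: nothing is printed unless litellm.set_verbose is turned on. A minimal illustrative stand-in for that helper (not the library's exact implementation, which lives in utils.py) looks like this:

# Illustrative sketch of a verbosity-gated logger like the one the new log lines rely on.
set_verbose = False  # in litellm this is toggled via `litellm.set_verbose = True`

def print_verbose(print_statement):
    # Stay silent on the streaming hot path unless the user opted into debug output.
    if set_verbose:
        print(print_statement)

print_verbose("PROCESSED CHUNK POST CHUNK CREATOR: ...")  # no output by default
set_verbose = True
print_verbose("HITS AN ERROR: ...")  # now printed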