fix(llm_guard.py): add streaming hook for moderation calls

Krrish Dholakia 2024-02-20 20:31:32 -08:00
parent 0a5b8f0e4e
commit 49847347d0
4 changed files with 36 additions and 25 deletions
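
For context, a "streaming hook for moderation calls" generally means running a guardrail check over the chunks of a streamed completion before they reach the client. The sketch below only illustrates that idea and is not the code added by this commit; the ModerationGuard class, streaming_hook method, and banned_terms parameter are hypothetical names invented for the example, not LiteLLM's actual interface.

# NOTE: hypothetical sketch, not the hook added in this commit. The class,
# method, and parameter names below are invented for illustration only.
from typing import AsyncIterator


class ModerationGuard:
    """Illustrative guardrail that screens a streamed completion chunk by chunk."""

    def __init__(self, banned_terms: list[str]):
        self.banned_terms = [term.lower() for term in banned_terms]

    async def streaming_hook(
        self, chunks: AsyncIterator[str]
    ) -> AsyncIterator[str]:
        # Accumulate the text seen so far and stop forwarding chunks
        # as soon as the moderation check trips.
        seen = ""
        async for chunk in chunks:
            seen += chunk
            if any(term in seen.lower() for term in self.banned_terms):
                yield "[response blocked by moderation]"
                return
            yield chunk

# Usage (assuming some async generator `model_stream` of text chunks):
#     guard = ModerationGuard(banned_terms=["password"])
#     async for chunk in guard.streaming_hook(model_stream):
#         print(chunk, end="")

The hook itself lives in llm_guard.py, one of the four changed files, which is not part of this excerpt. The hunk shown below touches the Logging class in utils.py and removes a pre-call budget-cost block.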


@@ -909,20 +909,6 @@ class Logging:
f"LiteLLM.LoggingError: [Non-Blocking] Exception occurred while logging {traceback.format_exc()}"
)
if litellm.max_budget and self.stream:
start_time = self.start_time
end_time = (
self.start_time
) # no time has passed as the call hasn't been made yet
time_diff = (end_time - start_time).total_seconds()
float_diff = float(time_diff)
litellm._current_cost += litellm.completion_cost(
model=self.model,
prompt="".join(message["content"] for message in self.messages),
completion="",
total_time=float_diff,
)
# Input Integration Logging -> If you want to log the fact that an attempt to call the model was made
callbacks = litellm.input_callback + self.dynamic_input_callbacks
for callback in callbacks: