forked from phoenix/litellm-mirror
(v0) use custom loggers
This commit is contained in:
parent
4f28d204ce
commit
4489c2b898
1 changed files with 106 additions and 0 deletions
106
enterprise/callbacks/api_callback.py
Normal file
106
enterprise/callbacks/api_callback.py
Normal file
|
@ -0,0 +1,106 @@
|
|||
# callback to make a request to an API endpoint
|
||||
|
||||
#### What this does ####
|
||||
# On success, logs events to a user-configured custom API endpoint
|
||||
import dotenv, os
|
||||
import requests
|
||||
|
||||
from litellm.proxy._types import UserAPIKeyAuth
|
||||
from litellm.caching import DualCache
|
||||
|
||||
from typing import Literal, Union
|
||||
|
||||
dotenv.load_dotenv() # Loading env variables using dotenv
|
||||
import traceback
|
||||
|
||||
|
||||
#### What this does ####
|
||||
# On success + failure, log events to the configured custom API endpoint
|
||||
|
||||
import dotenv, os
|
||||
import requests
|
||||
|
||||
dotenv.load_dotenv() # Loading env variables using dotenv
|
||||
import traceback
|
||||
import datetime, subprocess, sys
|
||||
import litellm, uuid
|
||||
from litellm._logging import print_verbose, verbose_logger
|
||||
|
||||
|
||||
class GenericAPILogger:
    """Log LiteLLM call events by POSTing a JSON payload to a custom HTTP endpoint."""

    # Class variables or attributes
    def __init__(self, endpoint=None, headers=None):
        """Initialize the logger with a target endpoint.

        Args:
            endpoint: URL to POST log payloads to. Falls back to the
                ``GENERIC_LOGGER_ENDPOINT`` environment variable when omitted.
            headers: optional dict of HTTP request headers; defaults to a
                JSON content-type header.

        Raises:
            ValueError: if no endpoint is given and the env var is unset.
        """
        try:
            verbose_logger.debug(f"in init GenericAPILogger, endpoint {endpoint}")
            # Fix: the original never stored endpoint/headers on self, so
            # log_event crashed with AttributeError on self.endpoint.
            if endpoint is None:
                endpoint = os.getenv("GENERIC_LOGGER_ENDPOINT", None)
            if endpoint is None:
                raise ValueError(
                    "endpoint not set for GenericAPILogger - pass `endpoint` or set GENERIC_LOGGER_ENDPOINT"
                )
            self.endpoint = endpoint
            self.headers = (
                headers if headers is not None else {"Content-Type": "application/json"}
            )
        except Exception as e:
            print_verbose(f"Got exception on init GenericAPILogger client {str(e)}")
            raise e

    # This is sync, because we run this in a separate thread. Running in a separate
    # thread ensures it will never block an LLM API call.
    # Experience with s3, Langfuse shows that async logging events are complicated
    # and can block LLM calls
    def log_event(self, kwargs, response_obj, start_time, end_time, print_verbose):
        """POST one completed call's request/response data to ``self.endpoint``.

        Args:
            kwargs: litellm call kwargs (model, messages, litellm_params, ...).
            response_obj: model response; must contain a "usage" entry.
            start_time: call start timestamp.
            end_time: call end timestamp.
            print_verbose: logging function supplied by the caller.

        Returns:
            The ``requests.Response`` on success, or ``None`` if logging
            failed — errors are swallowed so logging never breaks an LLM call.
        """
        try:
            verbose_logger.debug(
                # Fixed copy-paste message: this is the generic logger, not s3.
                f"GenericAPILogger - Enters logging function for model {kwargs}"
            )

            # construct payload to send to the custom logger
            # follows the same params as langfuse.py
            litellm_params = kwargs.get("litellm_params", {})
            metadata = (
                litellm_params.get("metadata", {}) or {}
            )  # guard: litellm_params["metadata"] may be None
            messages = kwargs.get("messages")
            optional_params = kwargs.get("optional_params", {})
            call_type = kwargs.get("call_type", "litellm.completion")
            cache_hit = kwargs.get("cache_hit", False)
            usage = response_obj["usage"]
            # renamed from `id` to avoid shadowing the builtin
            event_id = response_obj.get("id", str(uuid.uuid4()))

            # Build the initial payload
            payload = {
                "id": event_id,
                "call_type": call_type,
                "cache_hit": cache_hit,
                "startTime": start_time,
                "endTime": end_time,
                "model": kwargs.get("model", ""),
                "user": kwargs.get("user", ""),
                "modelParameters": optional_params,
                "messages": messages,
                "response": response_obj,
                "usage": usage,
                "metadata": metadata,
            }

            # Ensure everything in the payload is converted to str so it is
            # JSON-serializable regardless of the original value types.
            for key, value in payload.items():
                try:
                    payload[key] = str(value)
                except Exception:
                    # non blocking if it can't cast to a str
                    pass

            import json

            payload = json.dumps(payload)

            print_verbose(f"\nGeneric Logger - Logging payload = {payload}")

            # make request to endpoint with payload
            response = requests.post(self.endpoint, data=payload, headers=self.headers)

            response_status = response.status_code
            response_text = response.text

            print_verbose(
                f"Generic Logger - final response status = {response_status}, response text = {response_text}"
            )
            return response
        except Exception as e:
            # Logging must never propagate errors into the LLM call path.
            traceback.print_exc()
            verbose_logger.debug(f"Generic - {str(e)}\n{traceback.format_exc()}")
            pass
|
Loading…
Add table
Add a link
Reference in a new issue