Merge pull request #2363 from BerriAI/litellm_handle_circular_ref

(Fix) High Traffic Fix - handle litellm circular ref error
2024-03-06 12:38:01 -08:00 · 2024-03-06 12:38:01 -08:00 · 6c79bea177
commit 6c79bea177
parent 81b92f3434 c4079b2548
3 changed files with 67 additions and 9 deletions
--- a/litellm/integrations/langfuse.py
+++ b/litellm/integrations/langfuse.py
@ -265,8 +265,14 @@ class LangFuseLogger:
            cost = kwargs.get("response_cost", None)
            print_verbose(f"trace: {cost}")
-            if supports_tags:
+
            # Clean Metadata before logging - never log raw metadata
            # the raw metadata can contain circular references, which lead to infinite recursion
            # we clean out all extra litellm metadata params before logging
            clean_metadata = {}
            if isinstance(metadata, dict):
                for key, value in metadata.items():
                    # generate langfuse tags
                    if key in [
                        "user_api_key",
                        "user_api_key_user_id",
@ -274,6 +280,19 @@ class LangFuseLogger:
                        "semantic-similarity",
                    ]:
                        tags.append(f"{key}:{value}")
                    # clean litellm metadata before logging
                    if key in [
                        "headers",
                        "endpoint",
                        "caching_groups",
                        "previous_models",
                    ]:
                        continue
                    else:
                        clean_metadata[key] = value
            if supports_tags:
                if "cache_hit" in kwargs:
                    if kwargs["cache_hit"] is None:
                        kwargs["cache_hit"] = False
@ -301,7 +320,7 @@ class LangFuseLogger:
                "input": input,
                "output": output,
                "usage": usage,
-                "metadata": metadata,
+                "metadata": clean_metadata,
                "level": level,
            }
--- a/litellm/integrations/s3.py
+++ b/litellm/integrations/s3.py
@ -104,6 +104,23 @@ class S3Logger:
            usage = response_obj["usage"]
            id = response_obj.get("id", str(uuid.uuid4()))
            # Clean Metadata before logging - never log raw metadata
            # the raw metadata can contain circular references, which lead to infinite recursion
            # we clean out all extra litellm metadata params before logging
            clean_metadata = {}
            if isinstance(metadata, dict):
                for key, value in metadata.items():
                    # clean litellm metadata before logging
                    if key in [
                        "headers",
                        "endpoint",
                        "caching_groups",
                        "previous_models",
                    ]:
                        continue
                    else:
                        clean_metadata[key] = value
            # Build the initial payload
            payload = {
                "id": id,
@ -117,7 +134,7 @@ class S3Logger:
                "messages": messages,
                "response": response_obj,
                "usage": usage,
-                "metadata": metadata,
+                "metadata": clean_metadata,
            }
            # Ensure everything in the payload is converted to str
--- a/litellm/proxy/utils.py
+++ b/litellm/proxy/utils.py
@ -512,7 +512,11 @@ class PrismaClient:
        for k, v in db_data.items():
            if isinstance(v, dict):
                try:
                    db_data[k] = json.dumps(v)
                except:
                    # This avoids Prisma retrying this 5 times, and making 5 clients
                    db_data[k] = "failed-to-serialize-json"
        return db_data
    @backoff.on_exception(
@ -1641,10 +1645,28 @@ def get_logging_payload(kwargs, response_obj, start_time, end_time):
    if api_key is not None and isinstance(api_key, str) and api_key.startswith("sk-"):
        # hash the api_key
        api_key = hash_token(api_key)
-    if "headers" in metadata and "authorization" in metadata["headers"]:
+
-        metadata["headers"].pop(
+    # clean up litellm metadata
-            "authorization"
+    if isinstance(metadata, dict):
-        )  # do not store the original `sk-..` api key in the db
+        clean_metadata = {}
        verbose_proxy_logger.debug(
            f"getting payload for SpendLogs, available keys in metadata: "
            + str(list(metadata.keys()))
        )
        for key in metadata:
            if key in [
                "headers",
                "endpoint",
                "model_group",
                "deployment",
                "model_info",
                "caching_groups",
                "previous_models",
            ]:
                continue
            else:
                clean_metadata[key] = metadata[key]
    if litellm.cache is not None:
        cache_key = litellm.cache.get_cache_key(**kwargs)
    else:
@ -1668,7 +1690,7 @@ def get_logging_payload(kwargs, response_obj, start_time, end_time):
        "team_id": kwargs.get("litellm_params", {})
        .get("metadata", {})
        .get("user_api_key_team_id", ""),
-        "metadata": metadata,
+        "metadata": clean_metadata,
        "cache_key": cache_key,
        "spend": kwargs.get("response_cost", 0),
        "total_tokens": usage.get("total_tokens", 0),