forked from phoenix/litellm-mirror
Feat: Add Langtrace integration (#5341)
* Feat: Add Langtrace integration * add langtrace service name * fix timestamps for traces * add tests * Discard Callback + use existing otel logger * cleanup * remove print statments * remove callback * add docs * docs * add logging docs * format logging * remove emoji and add litellm proxy example * format logging * format `logging.md` * add langtrace docs to logging.md * sync conflict
This commit is contained in:
parent
42174fde4e
commit
7ec414a3cf
7 changed files with 291 additions and 0 deletions
63
docs/my-website/docs/observability/langtrace_integration.md
Normal file
63
docs/my-website/docs/observability/langtrace_integration.md
Normal file
|
@ -0,0 +1,63 @@
|
||||||
|
import Image from '@theme/IdealImage';
|
||||||
|
|
||||||
|
# Langtrace AI
|
||||||
|
|
||||||
|
Monitor, evaluate & improve your LLM apps
|
||||||
|
|
||||||
|
## Pre-Requisites
|
||||||
|
|
||||||
|
Make an account on [Langtrace AI](https://langtrace.ai/login)
|
||||||
|
|
||||||
|
## Quick Start
|
||||||
|
|
||||||
|
Use just 2 lines of code to instantly log your responses **across all providers** with Langtrace
|
||||||
|
|
||||||
|
```python
|
||||||
|
litellm.callbacks = ["langtrace"]
|
||||||
|
langtrace.init()
|
||||||
|
```
|
||||||
|
|
||||||
|
```python
|
||||||
|
import litellm
|
||||||
|
import os
|
||||||
|
from langtrace_python_sdk import langtrace
|
||||||
|
|
||||||
|
# Langtrace API Keys
|
||||||
|
os.environ["LANGTRACE_API_KEY"] = "<your-api-key>"
|
||||||
|
|
||||||
|
# LLM API Keys
|
||||||
|
os.environ['OPENAI_API_KEY']="<openai-api-key>"
|
||||||
|
|
||||||
|
# set langtrace as a callback, litellm will send the data to langtrace
|
||||||
|
litellm.callbacks = ["langtrace"]
|
||||||
|
|
||||||
|
# init langtrace
|
||||||
|
langtrace.init()
|
||||||
|
|
||||||
|
# openai call
|
||||||
|
response = litellm.completion(
|
||||||
|
model="gpt-4o",
|
||||||
|
messages=[
|
||||||
|
{"content": "respond only in Yoda speak.", "role": "system"},
|
||||||
|
{"content": "Hello, how are you?", "role": "user"},
|
||||||
|
],
|
||||||
|
)
|
||||||
|
print(response)
|
||||||
|
```
|
||||||
|
|
||||||
|
### Using with LiteLLM Proxy
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
model_list:
|
||||||
|
- model_name: gpt-4
|
||||||
|
litellm_params:
|
||||||
|
model: openai/fake
|
||||||
|
api_key: fake-key
|
||||||
|
api_base: https://exampleopenaiendpoint-production.up.railway.app/
|
||||||
|
|
||||||
|
litellm_settings:
|
||||||
|
callbacks: ["langtrace"]
|
||||||
|
|
||||||
|
environment_variables:
|
||||||
|
LANGTRACE_API_KEY: "141a****"
|
||||||
|
```
|
|
@ -1307,6 +1307,47 @@ curl --location 'http://0.0.0.0:4000/chat/completions' \
|
||||||
Expect to see your log on Langfuse
|
Expect to see your log on Langfuse
|
||||||
<Image img={require('../../img/langsmith_new.png')} />
|
<Image img={require('../../img/langsmith_new.png')} />
|
||||||
|
|
||||||
|
|
||||||
|
## Logging LLM IO to Langtrace
|
||||||
|
|
||||||
|
1. Set `callbacks: ["langtrace"]` on litellm config.yaml
|
||||||
|
|
||||||
|
```yaml
|
||||||
|
model_list:
|
||||||
|
- model_name: gpt-4
|
||||||
|
litellm_params:
|
||||||
|
model: openai/fake
|
||||||
|
api_key: fake-key
|
||||||
|
api_base: https://exampleopenaiendpoint-production.up.railway.app/
|
||||||
|
|
||||||
|
litellm_settings:
|
||||||
|
callbacks: ["langtrace"]
|
||||||
|
|
||||||
|
environment_variables:
|
||||||
|
LANGTRACE_API_KEY: "141a****"
|
||||||
|
```
|
||||||
|
|
||||||
|
2. Start Proxy
|
||||||
|
|
||||||
|
```
|
||||||
|
litellm --config /path/to/config.yaml
|
||||||
|
```
|
||||||
|
|
||||||
|
3. Test it!
|
||||||
|
|
||||||
|
```bash
|
||||||
|
curl --location 'http://0.0.0.0:4000/chat/completions' \
|
||||||
|
--header 'Content-Type: application/json' \
|
||||||
|
--data ' {
|
||||||
|
"model": "fake-openai-endpoint",
|
||||||
|
"messages": [
|
||||||
|
{
|
||||||
|
"role": "user",
|
||||||
|
"content": "Hello, Claude gm!"
|
||||||
|
}
|
||||||
|
]
|
||||||
|
}
|
||||||
|
'
|
||||||
## Logging LLM IO to Galileo
|
## Logging LLM IO to Galileo
|
||||||
|
|
||||||
[BETA]
|
[BETA]
|
||||||
|
|
|
@ -51,6 +51,7 @@ _custom_logger_compatible_callbacks_literal = Literal[
|
||||||
"galileo",
|
"galileo",
|
||||||
"braintrust",
|
"braintrust",
|
||||||
"arize",
|
"arize",
|
||||||
|
"langtrace",
|
||||||
"gcs_bucket",
|
"gcs_bucket",
|
||||||
"opik",
|
"opik",
|
||||||
]
|
]
|
||||||
|
|
108
litellm/integrations/langtrace.py
Normal file
108
litellm/integrations/langtrace.py
Normal file
|
@ -0,0 +1,108 @@
|
||||||
|
import traceback
|
||||||
|
import json
|
||||||
|
from litellm.integrations.custom_logger import CustomLogger
|
||||||
|
from litellm.proxy._types import SpanAttributes
|
||||||
|
|
||||||
|
from typing import TYPE_CHECKING, Any, Optional, Union
|
||||||
|
|
||||||
|
if TYPE_CHECKING:
|
||||||
|
from opentelemetry.trace import Span as _Span
|
||||||
|
|
||||||
|
Span = _Span
|
||||||
|
else:
|
||||||
|
Span = Any
|
||||||
|
|
||||||
|
|
||||||
|
class LangtraceAttributes:
    """
    Maps a LiteLLM request/response pair onto a Langtrace-compatible
    OpenTelemetry span using the ``gen_ai.*`` semantic-convention keys.
    """

    def set_langtrace_attributes(self, span: Span, kwargs, response_obj):
        """
        Log one LLM call to Langtrace.

        Args:
            span: the OpenTelemetry span to decorate.
            kwargs: the LiteLLM logging payload for the call.
            response_obj: the model response (dict-like).
        """
        # `litellm_params` may be absent or None depending on the call path —
        # guard instead of chaining .get() on a possible None.
        litellm_params = kwargs.get("litellm_params") or {}
        vendor = litellm_params.get("custom_llm_provider")
        optional_params = kwargs.get("optional_params", {})
        # Merge so request options (temperature, top_p, ...) are visible
        # alongside the top-level kwargs when building span attributes.
        options = {**kwargs, **optional_params}
        self.set_request_attributes(span, options, vendor)
        self.set_response_attributes(span, response_obj)
        self.set_usage_attributes(span, response_obj)

    def set_request_attributes(self, span: Span, kwargs, vendor):
        """
        Record request-side span attributes (model, sampling params) and emit
        the prompt messages as a ``gen_ai.content.prompt`` span event.
        """
        span_attributes = {
            "gen_ai.operation.name": "chat",
            "langtrace.service.name": vendor,
            SpanAttributes.LLM_REQUEST_MODEL.value: kwargs.get("model"),
            SpanAttributes.LLM_IS_STREAMING.value: kwargs.get("stream"),
            SpanAttributes.LLM_REQUEST_TEMPERATURE.value: kwargs.get("temperature"),
            SpanAttributes.LLM_TOP_K.value: kwargs.get("top_k"),
            SpanAttributes.LLM_REQUEST_TOP_P.value: kwargs.get("top_p"),
            SpanAttributes.LLM_USER.value: kwargs.get("user"),
            SpanAttributes.LLM_REQUEST_MAX_TOKENS.value: kwargs.get("max_tokens"),
            SpanAttributes.LLM_RESPONSE_STOP_REASON.value: kwargs.get("stop"),
            SpanAttributes.LLM_FREQUENCY_PENALTY.value: kwargs.get("frequency_penalty"),
            SpanAttributes.LLM_PRESENCE_PENALTY.value: kwargs.get("presence_penalty"),
        }

        prompts = kwargs.get("messages")

        if prompts:
            span.add_event(
                name="gen_ai.content.prompt",
                attributes={SpanAttributes.LLM_PROMPTS.value: json.dumps(prompts)},
            )

        self.set_span_attributes(span, span_attributes)

    def set_response_attributes(self, span: Span, response_obj):
        """
        Record response-side span attributes (response id, model) and emit the
        completion choices as a ``gen_ai.content.completion`` span event.
        """
        response_attributes = {
            "gen_ai.response_id": response_obj.get("id"),
            "gen_ai.system_fingerprint": response_obj.get("system_fingerprint"),
            SpanAttributes.LLM_RESPONSE_MODEL.value: response_obj.get("model"),
        }
        completions = []
        for choice in response_obj.get("choices", []):
            # `message` can be missing on a malformed choice — guard the chain.
            message = choice.get("message") or {}
            completions.append(
                {"role": message.get("role"), "content": message.get("content")}
            )

        span.add_event(
            name="gen_ai.content.completion",
            # BUGFIX: use `.value` so the attribute key is a plain string,
            # consistent with every other SpanAttributes usage in this class
            # (an enum member is not a valid OTel attribute key).
            attributes={SpanAttributes.LLM_COMPLETIONS.value: json.dumps(completions)},
        )

        self.set_span_attributes(span, response_attributes)

    def set_usage_attributes(self, span: Span, response_obj):
        """
        Record token-usage span attributes, if the provider returned usage.
        """
        usage = response_obj.get("usage")
        if usage:
            usage_attributes = {
                SpanAttributes.LLM_USAGE_PROMPT_TOKENS.value: usage.get(
                    "prompt_tokens"
                ),
                SpanAttributes.LLM_USAGE_COMPLETION_TOKENS.value: usage.get(
                    "completion_tokens"
                ),
                SpanAttributes.LLM_USAGE_TOTAL_TOKENS.value: usage.get("total_tokens"),
            }
            self.set_span_attributes(span, usage_attributes)

    def set_span_attributes(self, span: Span, attributes):
        """
        Copy each truthy attribute onto the span.

        NOTE(review): falsy-but-meaningful values (0, False, "") are skipped
        by this truthiness check; preserved as-is for backward compatibility.
        """
        for key, value in attributes.items():
            if not value:
                continue
            span.set_attribute(key, value)
|
|
@ -352,6 +352,13 @@ class OpenTelemetry(CustomLogger):
|
||||||
|
|
||||||
set_arize_ai_attributes(span, kwargs, response_obj)
|
set_arize_ai_attributes(span, kwargs, response_obj)
|
||||||
return
|
return
|
||||||
|
elif self.callback_name == "langtrace":
|
||||||
|
from litellm.integrations.langtrace import LangtraceAttributes
|
||||||
|
|
||||||
|
LangtraceAttributes().set_langtrace_attributes(
|
||||||
|
span, kwargs, response_obj
|
||||||
|
)
|
||||||
|
return
|
||||||
from litellm.proxy._types import SpanAttributes
|
from litellm.proxy._types import SpanAttributes
|
||||||
|
|
||||||
optional_params = kwargs.get("optional_params", {})
|
optional_params = kwargs.get("optional_params", {})
|
||||||
|
|
|
@ -2531,6 +2531,31 @@ def _init_custom_logger_compatible_class(
|
||||||
dynamic_rate_limiter_obj.update_variables(llm_router=llm_router)
|
dynamic_rate_limiter_obj.update_variables(llm_router=llm_router)
|
||||||
_in_memory_loggers.append(dynamic_rate_limiter_obj)
|
_in_memory_loggers.append(dynamic_rate_limiter_obj)
|
||||||
return dynamic_rate_limiter_obj # type: ignore
|
return dynamic_rate_limiter_obj # type: ignore
|
||||||
|
elif logging_integration == "langtrace":
|
||||||
|
if "LANGTRACE_API_KEY" not in os.environ:
|
||||||
|
raise ValueError("LANGTRACE_API_KEY not found in environment variables")
|
||||||
|
|
||||||
|
from litellm.integrations.opentelemetry import (
|
||||||
|
OpenTelemetry,
|
||||||
|
OpenTelemetryConfig,
|
||||||
|
)
|
||||||
|
|
||||||
|
otel_config = OpenTelemetryConfig(
|
||||||
|
exporter="otlp_http",
|
||||||
|
endpoint="https://langtrace.ai/api/trace",
|
||||||
|
)
|
||||||
|
os.environ["OTEL_EXPORTER_OTLP_TRACES_HEADERS"] = (
|
||||||
|
f"api_key={os.getenv('LANGTRACE_API_KEY')}"
|
||||||
|
)
|
||||||
|
for callback in _in_memory_loggers:
|
||||||
|
if (
|
||||||
|
isinstance(callback, OpenTelemetry)
|
||||||
|
and callback.callback_name == "langtrace"
|
||||||
|
):
|
||||||
|
return callback # type: ignore
|
||||||
|
_otel_logger = OpenTelemetry(config=otel_config, callback_name="langtrace")
|
||||||
|
_in_memory_loggers.append(_otel_logger)
|
||||||
|
return _otel_logger # type: ignore
|
||||||
|
|
||||||
|
|
||||||
def get_custom_logger_compatible_class(
|
def get_custom_logger_compatible_class(
|
||||||
|
@ -2612,6 +2637,19 @@ def get_custom_logger_compatible_class(
|
||||||
for callback in _in_memory_loggers:
|
for callback in _in_memory_loggers:
|
||||||
if isinstance(callback, _PROXY_DynamicRateLimitHandler):
|
if isinstance(callback, _PROXY_DynamicRateLimitHandler):
|
||||||
return callback # type: ignore
|
return callback # type: ignore
|
||||||
|
|
||||||
|
elif logging_integration == "langtrace":
|
||||||
|
from litellm.integrations.opentelemetry import OpenTelemetry
|
||||||
|
|
||||||
|
if "LANGTRACE_API_KEY" not in os.environ:
|
||||||
|
raise ValueError("LANGTRACE_API_KEY not found in environment variables")
|
||||||
|
|
||||||
|
for callback in _in_memory_loggers:
|
||||||
|
if (
|
||||||
|
isinstance(callback, OpenTelemetry)
|
||||||
|
and callback.callback_name == "langtrace"
|
||||||
|
):
|
||||||
|
return callback
|
||||||
return None
|
return None
|
||||||
|
|
||||||
|
|
||||||
|
|
33
litellm/tests/test_langtrace.py
Normal file
33
litellm/tests/test_langtrace.py
Normal file
|
@ -0,0 +1,33 @@
|
||||||
|
import os
|
||||||
|
import sys
|
||||||
|
import time
|
||||||
|
|
||||||
|
import pytest
|
||||||
|
from opentelemetry.sdk.trace.export.in_memory_span_exporter import InMemorySpanExporter
|
||||||
|
from langtrace_python_sdk import langtrace
|
||||||
|
|
||||||
|
import litellm
|
||||||
|
|
||||||
|
sys.path.insert(0, os.path.abspath("../.."))
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.fixture()
def exporter():
    """Initialise langtrace with an in-memory span exporter and wire litellm
    to report successes to the langtrace callback."""
    span_exporter = InMemorySpanExporter()
    langtrace.init(batch=False, custom_remote_exporter=span_exporter)
    litellm.success_callback = ["langtrace"]
    litellm.set_verbose = True
    return span_exporter
|
||||||
|
|
||||||
|
|
||||||
|
@pytest.mark.parametrize("model", ["claude-2.1", "gpt-3.5-turbo"])
def test_langtrace_logging(exporter, model):
    """Smoke test: a mocked completion call runs cleanly with the langtrace
    success callback enabled (exporter fixture wires up the integration)."""
    call_params = dict(
        model=model,
        messages=[{"role": "user", "content": "This is a test"}],
        max_tokens=1000,
        temperature=0.7,
        timeout=5,
        mock_response="hi",
    )
    litellm.completion(**call_params)
|
Loading…
Add table
Add a link
Reference in a new issue