openai-ergonomic 0.5.2

//! Langfuse interceptor for OpenTelemetry-based LLM observability.
//!
//! This interceptor automatically instruments `OpenAI` API calls with OpenTelemetry spans.
//! You must configure the OpenTelemetry tracer with Langfuse exporter separately.
//!
//! # Usage
//!
//! ```no_run
//! # use openai_ergonomic::{Builder, Client};
//! # use openai_ergonomic::langfuse_interceptor::{LangfuseInterceptor, LangfuseConfig};
//! # use opentelemetry_langfuse::ExporterBuilder;
//! # use opentelemetry_sdk::runtime::Tokio;
//! # use opentelemetry_sdk::trace::span_processor_with_async_runtime::BatchSpanProcessor;
//! # use opentelemetry_sdk::trace::SdkTracerProvider;
//! # use opentelemetry::global;
//! # use opentelemetry::trace::TracerProvider;
//! # async fn example() -> Result<(), Box<dyn std::error::Error>> {
//! // 1. Build Langfuse exporter
//! let exporter = ExporterBuilder::from_env()?.build()?;
//!
//! // 2. Create tracer provider
//! let provider = SdkTracerProvider::builder()
//!     .with_span_processor(BatchSpanProcessor::builder(exporter, Tokio).build())
//!     .build();
//!
//! global::set_tracer_provider(provider.clone());
//!
//! // 3. Create interceptor with tracer
//! let tracer = provider.tracer("openai-ergonomic");
//! let interceptor = LangfuseInterceptor::new(tracer, LangfuseConfig::new());
//! let client = Client::from_env()?
//!     .with_interceptor(Box::new(interceptor))
//!     .build();
//!
//! // Traces are automatically sent to Langfuse
//! let response = client.send_chat(client.chat_simple("Hello!")).await?;
//! # Ok(())
//! # }
//! ```

use crate::interceptor::{
    AfterResponseContext, BeforeRequestContext, ErrorContext, Interceptor, StreamChunkContext,
    StreamEndContext,
};
use crate::Result;
use opentelemetry::{
    trace::{SpanKind, Tracer},
    KeyValue,
};
use opentelemetry_langfuse::LangfuseContext;
use opentelemetry_semantic_conventions::attribute::{
    GEN_AI_OPERATION_NAME, GEN_AI_REQUEST_MAX_TOKENS, GEN_AI_REQUEST_MODEL,
    GEN_AI_REQUEST_TEMPERATURE, GEN_AI_RESPONSE_ID, GEN_AI_SYSTEM, GEN_AI_USAGE_INPUT_TOKENS,
    GEN_AI_USAGE_OUTPUT_TOKENS,
};
use serde_json::Value;
use std::sync::{Arc, Mutex};
use tracing::{debug, error, info};

/// State managed by the Langfuse interceptor across the request lifecycle.
///
/// This state is passed through the interceptor hooks to maintain
/// span information without requiring global state.
///
/// Uses `Mutex` for interior mutability to ensure thread-safety in async contexts.
///
/// The generic type `S` is the Span type from the tracer.
pub struct LangfuseState<S = opentelemetry::global::BoxedSpan> {
    /// The active span for this request (uses Mutex for thread-safe interior mutability)
    pub(crate) span: Mutex<Option<S>>,
}

impl<S> Default for LangfuseState<S> {
    fn default() -> Self {
        Self {
            span: Mutex::new(None),
        }
    }
}

/// Configuration for the Langfuse interceptor.
#[derive(Debug, Clone)]
pub struct LangfuseConfig {
    /// Enable debug logging
    pub debug: bool,
}

impl Default for LangfuseConfig {
    fn default() -> Self {
        Self {
            debug: std::env::var("LANGFUSE_DEBUG")
                .unwrap_or_else(|_| "false".to_string())
                .parse()
                .unwrap_or(false),
        }
    }
}

impl LangfuseConfig {
    /// Create a new configuration.
    pub fn new() -> Self {
        Self::default()
    }

    /// Enable debug logging.
    #[must_use]
    pub fn with_debug(mut self, debug: bool) -> Self {
        self.debug = debug;
        self
    }
}

/// Langfuse interceptor for OpenTelemetry-based observability.
///
/// This interceptor automatically creates spans for API calls.
/// Spans are maintained across `before_request` and `after_response` using a global registry
/// and request metadata, requiring no user code changes.
///
/// The tracer must be configured externally - this interceptor only instruments API calls.
pub struct LangfuseInterceptor<T: Tracer + Send + Sync> {
    config: LangfuseConfig,
    tracer: Arc<T>,
    context: Arc<LangfuseContext>,
}

impl<T: Tracer + Send + Sync> LangfuseInterceptor<T>
where
    T::Span: Send + Sync + 'static,
{
    /// Create a new Langfuse interceptor with the given tracer.
    ///
    /// The tracer should be configured to export to Langfuse using
    /// `opentelemetry_langfuse::ExporterBuilder`.
    ///
    /// # Example
    ///
    /// ```no_run
    /// use opentelemetry::global;
    /// use opentelemetry::trace::TracerProvider;
    /// use opentelemetry_langfuse::ExporterBuilder;
    /// use opentelemetry_sdk::runtime::Tokio;
    /// use opentelemetry_sdk::trace::span_processor_with_async_runtime::BatchSpanProcessor;
    /// use opentelemetry_sdk::trace::SdkTracerProvider;
    ///
    /// # async fn setup() -> Result<(), Box<dyn std::error::Error>> {
    /// // Build exporter
    /// let exporter = ExporterBuilder::from_env()?.build()?;
    ///
    /// // Create tracer provider with batch processor
    /// let provider = SdkTracerProvider::builder()
    ///     .with_span_processor(BatchSpanProcessor::builder(exporter, Tokio).build())
    ///     .build();
    ///
    /// // Set as global provider
    /// global::set_tracer_provider(provider.clone());
    ///
    /// // Get tracer for interceptor
    /// let tracer = provider.tracer("openai-ergonomic");
    ///
    /// // Create interceptor with tracer
    /// use openai_ergonomic::langfuse_interceptor::{LangfuseInterceptor, LangfuseConfig};
    /// let interceptor = LangfuseInterceptor::new(tracer, LangfuseConfig::new());
    /// # Ok(())
    /// # }
    /// ```
    pub fn new(tracer: T, config: LangfuseConfig) -> Self {
        if config.debug {
            info!("Langfuse interceptor initialized");
        }

        Self {
            config,
            tracer: Arc::new(tracer),
            context: Arc::new(LangfuseContext::new()),
        }
    }

    /// Set the session ID for traces created by this interceptor.
    pub fn set_session_id(&self, session_id: impl Into<String>) {
        self.context.set_session_id(session_id);
    }

    /// Set the user ID for traces created by this interceptor.
    pub fn set_user_id(&self, user_id: impl Into<String>) {
        self.context.set_user_id(user_id);
    }

    /// Add tags to traces created by this interceptor.
    pub fn add_tags(&self, tags: Vec<String>) {
        self.context.add_tags(tags);
    }

    /// Add a single tag to traces created by this interceptor.
    pub fn add_tag(&self, tag: impl Into<String>) {
        self.context.add_tag(tag);
    }

    /// Set metadata for traces created by this interceptor.
    pub fn set_metadata(&self, metadata: serde_json::Value) {
        self.context.set_metadata(metadata);
    }

    /// Clear all context attributes.
    pub fn clear_context(&self) {
        self.context.clear();
    }

    /// Get a reference to the Langfuse context.
    pub fn context(&self) -> &Arc<LangfuseContext> {
        &self.context
    }

    /// Extract request parameters from JSON.
    fn extract_request_params(request_json: &str) -> serde_json::Result<Value> {
        serde_json::from_str(request_json)
    }
}

#[async_trait::async_trait]
impl<T: Tracer + Send + Sync> Interceptor<LangfuseState<T::Span>> for LangfuseInterceptor<T>
where
    T::Span: Send + Sync + 'static,
{
    async fn before_request(
        &self,
        ctx: &mut BeforeRequestContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        let tracer = self.tracer.as_ref();

        // Build initial attributes
        let mut attributes = vec![
            KeyValue::new(GEN_AI_SYSTEM, "openai"),
            KeyValue::new(GEN_AI_OPERATION_NAME, ctx.operation.to_string()),
            KeyValue::new(GEN_AI_REQUEST_MODEL, ctx.model.to_string()),
        ];

        // Add Langfuse context attributes from this interceptor's context
        attributes.extend(self.context.get_attributes());

        // Parse request JSON and add relevant attributes
        if let Ok(params) = Self::extract_request_params(ctx.request_json) {
            if let Some(temperature) = params
                .get("temperature")
                .and_then(serde_json::Value::as_f64)
            {
                attributes.push(KeyValue::new(GEN_AI_REQUEST_TEMPERATURE, temperature));
            }
            if let Some(max_tokens) = params.get("max_tokens").and_then(serde_json::Value::as_i64) {
                attributes.push(KeyValue::new(GEN_AI_REQUEST_MAX_TOKENS, max_tokens));
            }

            // Add messages as gen_ai.prompt attributes
            if let Some(messages) = params.get("messages").and_then(serde_json::Value::as_array) {
                for (i, message) in messages.iter().enumerate() {
                    if let Some(obj) = message.as_object() {
                        let role = obj
                            .get("role")
                            .and_then(serde_json::Value::as_str)
                            .unwrap_or("unknown")
                            .to_string();
                        let content = obj
                            .get("content")
                            .and_then(serde_json::Value::as_str)
                            .unwrap_or("")
                            .to_string();

                        attributes.push(KeyValue::new(format!("gen_ai.prompt.{i}.role"), role));
                        attributes
                            .push(KeyValue::new(format!("gen_ai.prompt.{i}.content"), content));
                    }
                }
            }
        }

        // Create span and store it in state
        let span = tracer
            .span_builder(ctx.operation.to_string())
            .with_kind(SpanKind::Client)
            .with_attributes(attributes)
            .start(tracer);

        // Store span directly in state
        *ctx.state.span.lock().unwrap() = Some(span);

        if self.config.debug {
            debug!("Started Langfuse span for operation: {}", ctx.operation);
        }

        Ok(())
    }

    async fn after_response(
        &self,
        ctx: &AfterResponseContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        use opentelemetry::trace::Span;

        // Take the span from state so we can end it
        let Some(mut span) = ctx.state.span.lock().unwrap().take() else {
            if self.config.debug {
                debug!("No span found in state for operation: {}", ctx.operation);
            }
            return Ok(());
        };

        // Add response attributes to the span

        #[allow(clippy::cast_possible_truncation)]
        {
            span.set_attribute(KeyValue::new(
                "duration_ms",
                ctx.duration.as_millis() as i64,
            ));
        }

        // Add usage metrics if available
        if let Some(input_tokens) = ctx.input_tokens {
            span.set_attribute(KeyValue::new(GEN_AI_USAGE_INPUT_TOKENS, input_tokens));
        }
        if let Some(output_tokens) = ctx.output_tokens {
            span.set_attribute(KeyValue::new(GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens));
        }

        // Parse response and add completion content
        if let Ok(response) = Self::extract_request_params(ctx.response_json) {
            // Add response ID if available
            if let Some(id) = response.get("id").and_then(serde_json::Value::as_str) {
                span.set_attribute(KeyValue::new(GEN_AI_RESPONSE_ID, id.to_string()));
            }

            // Add completion content
            if let Some(choices) = response
                .get("choices")
                .and_then(serde_json::Value::as_array)
            {
                for (i, choice) in choices.iter().enumerate() {
                    if let Some(message) = choice.get("message") {
                        if let Some(role) = message.get("role").and_then(serde_json::Value::as_str)
                        {
                            span.set_attribute(KeyValue::new(
                                format!("gen_ai.completion.{i}.role"),
                                role.to_string(),
                            ));
                        }
                        if let Some(content) =
                            message.get("content").and_then(serde_json::Value::as_str)
                        {
                            span.set_attribute(KeyValue::new(
                                format!("gen_ai.completion.{i}.content"),
                                content.to_string(),
                            ));
                        }
                    }
                }
            }
        }

        // End the span
        span.end();

        if self.config.debug {
            debug!("Completed Langfuse span for operation: {}", ctx.operation);
        }

        Ok(())
    }

    async fn on_stream_chunk(
        &self,
        _ctx: &StreamChunkContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        // Stream chunks can add attributes to the current span if needed
        // For now, we just let them pass through
        Ok(())
    }

    async fn on_stream_end(
        &self,
        ctx: &StreamEndContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        use opentelemetry::trace::Span;

        // Take the span from state so we can end it
        let Some(mut span) = ctx.state.span.lock().unwrap().take() else {
            if self.config.debug {
                debug!(
                    "No span found in state for stream operation: {}",
                    ctx.operation
                );
            }
            return Ok(());
        };

        // Add final streaming attributes

        #[allow(clippy::cast_possible_truncation, clippy::cast_possible_wrap)]
        {
            span.set_attribute(KeyValue::new(
                "stream.total_chunks",
                ctx.total_chunks as i64,
            ));
            span.set_attribute(KeyValue::new(
                "stream.duration_ms",
                ctx.duration.as_millis() as i64,
            ));
        }

        if let Some(input_tokens) = ctx.input_tokens {
            span.set_attribute(KeyValue::new(GEN_AI_USAGE_INPUT_TOKENS, input_tokens));
        }
        if let Some(output_tokens) = ctx.output_tokens {
            span.set_attribute(KeyValue::new(GEN_AI_USAGE_OUTPUT_TOKENS, output_tokens));
        }

        // End the span
        span.end();

        if self.config.debug {
            info!(
                "Completed streaming span for operation: {} with {} chunks",
                ctx.operation, ctx.total_chunks
            );
        }

        Ok(())
    }

    async fn on_error(&self, ctx: &ErrorContext<'_, LangfuseState<T::Span>>) {
        use opentelemetry::trace::{Span, Status};

        // Take the span from state if available
        let Some(state) = ctx.state else {
            if self.config.debug {
                debug!(
                    "No state available for error in operation: {}",
                    ctx.operation
                );
            }
            return;
        };

        let Some(mut span) = state.span.lock().unwrap().take() else {
            if self.config.debug {
                debug!(
                    "No span found in state for error in operation: {}",
                    ctx.operation
                );
            }
            return;
        };

        // Set the span status to error
        span.set_status(Status::error(ctx.error.to_string()));

        // Add error attributes to the span
        span.set_attribute(KeyValue::new("error.type", format!("{:?}", ctx.error)));
        span.set_attribute(KeyValue::new("error.message", ctx.error.to_string()));

        if let Some(model) = ctx.model {
            span.set_attribute(KeyValue::new(GEN_AI_REQUEST_MODEL, model.to_string()));
        }

        // End the span
        span.end();

        if self.config.debug {
            error!(
                "Recorded error for operation {}: {}",
                ctx.operation, ctx.error
            );
        }
    }
}

// Implement Interceptor for Arc<LangfuseInterceptor<T>> to allow sharing the interceptor
#[async_trait::async_trait]
impl<T: Tracer + Send + Sync> Interceptor<LangfuseState<T::Span>> for Arc<LangfuseInterceptor<T>>
where
    T::Span: Send + Sync + 'static,
{
    async fn before_request(
        &self,
        ctx: &mut BeforeRequestContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        (**self).before_request(ctx).await
    }

    async fn after_response(
        &self,
        ctx: &AfterResponseContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        (**self).after_response(ctx).await
    }

    async fn on_stream_chunk(
        &self,
        ctx: &StreamChunkContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        (**self).on_stream_chunk(ctx).await
    }

    async fn on_stream_end(
        &self,
        ctx: &StreamEndContext<'_, LangfuseState<T::Span>>,
    ) -> Result<()> {
        (**self).on_stream_end(ctx).await
    }

    async fn on_error(&self, ctx: &ErrorContext<'_, LangfuseState<T::Span>>) {
        (**self).on_error(ctx).await;
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use opentelemetry::trace::noop::NoopTracer;

    #[test]
    fn test_config_from_env() {
        std::env::set_var("LANGFUSE_DEBUG", "true");

        let config = LangfuseConfig::default();
        assert!(config.debug);

        // Cleanup
        std::env::remove_var("LANGFUSE_DEBUG");
    }

    #[test]
    fn test_interceptor_creation() {
        let tracer = NoopTracer::new();
        let config = LangfuseConfig::new().with_debug(true);
        let _interceptor = LangfuseInterceptor::new(tracer, config);
        // No assertion needed - just verify it compiles and constructs
    }
}