// debtmap 0.17.0 - Docs.rs

//! Complexity attribution analysis.
//!
//! This module provides tools for attributing complexity metrics to specific
//! source code constructs, distinguishing between logical complexity,
//! formatting artifacts, and recognized patterns.

use crate::core::FunctionMetrics;
use serde::{Deserialize, Serialize};

/// Tracks changes in complexity between analysis runs.
///
/// Compares current analysis results with previous runs to identify
/// complexity trends and categorize changes.
pub mod change_tracker;
/// Pattern detection and complexity adjustment.
///
/// Identifies recognized patterns (error handling, validation, data transformation)
/// and adjusts complexity scores based on pattern familiarity.
pub mod pattern_tracker;
/// Complexity source tracking and classification.
///
/// Tracks the origin of complexity contributions, distinguishing logical
/// structure from formatting artifacts.
pub mod source_tracker;

use self::pattern_tracker::PatternTracker;
use self::source_tracker::{ComplexitySourceType, SourceTracker};

/// Estimated location information for complexity mapping.
///
/// Internal carrier produced by `AttributionEngine::estimate_complexity_locations`
/// and consumed by `AttributionEngine::generate_source_mappings`. The positions
/// are heuristic estimates, not the result of AST analysis.
#[derive(Debug, Clone)]
struct EstimatedComplexityLocation {
    /// Estimated source line of the complexity point.
    line: u32,
    /// Estimated column; the estimator uses 0 for the first point and 4 for the rest.
    column: u32,
    /// Optional `(start_line, end_line)` pair; the estimator sets both ends to `line`.
    span: Option<(u32, u32)>,
    /// Label appended to the AST path, e.g. `function_signature` or `control_flow_<n>`.
    construct_type: String,
    /// Human-readable description copied into the resulting mapping's `context`.
    context: String,
}

/// Core attribution engine for complexity source analysis.
///
/// Build one with `AttributionEngine::new` (or via `Default`) and call
/// `attribute` to obtain a `ComplexityAttribution` for a raw/normalized pair
/// of complexity results.
pub struct AttributionEngine {
    // Populated by `new`, but none of the engine's methods in this module read
    // it (only the unit tests do), hence the lint suppression.
    #[allow(dead_code)]
    source_trackers: Vec<Box<dyn SourceTracker>>,
    // Used by `attribute` to compute the pattern-complexity category.
    pattern_tracker: PatternTracker,
}

impl AttributionEngine {
    /// Creates a new attribution engine with default source trackers.
    ///
    /// Initializes the engine with trackers for logical structure complexity
    /// and formatting artifacts, plus a pattern tracker for recognized patterns.
    pub fn new() -> Self {
        Self {
            source_trackers: vec![
                Box::new(source_tracker::LogicalStructureTracker::new()),
                Box::new(source_tracker::FormattingArtifactTracker::new()),
            ],
            pattern_tracker: PatternTracker::new(),
        }
    }

    /// Splits measured complexity into logical, formatting, and pattern shares.
    ///
    /// * Logical complexity is derived from `normalized_result` alone.
    /// * Formatting artifacts are derived from the gap between `raw_result`
    ///   and `normalized_result`.
    /// * Pattern complexity comes from running the pattern tracker over the
    ///   normalized functions.
    /// * Source mappings are generated from the raw functions.
    ///
    /// Returns the four pieces bundled in a `ComplexityAttribution`.
    pub fn attribute(
        &self,
        raw_result: &super::multi_pass::ComplexityResult,
        normalized_result: &super::multi_pass::ComplexityResult,
    ) -> ComplexityAttribution {
        // Field initializers run top to bottom, which keeps the four analyses
        // in the order: logical, formatting, patterns, source mappings.
        ComplexityAttribution {
            logical_complexity: self.calculate_logical_complexity(normalized_result),
            formatting_artifacts: self
                .calculate_formatting_artifacts(raw_result, normalized_result),
            pattern_complexity: self
                .pattern_tracker
                .analyze_patterns(&normalized_result.functions),
            source_mappings: self.generate_source_mappings(&raw_result.functions),
        }
    }

    fn calculate_logical_complexity(
        &self,
        normalized_result: &super::multi_pass::ComplexityResult,
    ) -> AttributedComplexity {
        let mut total = 0u32;
        let mut breakdown = Vec::new();

        for func in &normalized_result.functions {
            total += func.cyclomatic;

            breakdown.push(ComplexityComponent {
                source_type: ComplexitySourceType::LogicalStructure {
                    construct_type: LogicalConstruct::Function,
                    nesting_level: func.nesting,
                },
                contribution: func.cyclomatic,
                location: CodeLocation {
                    file: func.file.to_string_lossy().to_string(),
                    line: func.line as u32,
                    column: 0,
                    span: None,
                },
                description: format!("Function: {}", func.name),
                suggestions: if func.cyclomatic > 10 {
                    vec![
                        "Consider breaking down this function".to_string(),
                        "Extract complex conditions into helper functions".to_string(),
                    ]
                } else {
                    vec![]
                },
            });
        }

        AttributedComplexity {
            total,
            breakdown,
            confidence: 0.9, // High confidence for logical complexity
        }
    }

    fn calculate_formatting_artifacts(
        &self,
        raw_result: &super::multi_pass::ComplexityResult,
        normalized_result: &super::multi_pass::ComplexityResult,
    ) -> AttributedComplexity {
        let raw_total = raw_result.total_complexity;
        let normalized_total = normalized_result.total_complexity;

        let artifact_total = raw_total.saturating_sub(normalized_total);

        let mut breakdown = Vec::new();

        // Compare function-by-function to identify formatting artifacts
        for (raw_func, norm_func) in raw_result
            .functions
            .iter()
            .zip(normalized_result.functions.iter())
        {
            let diff = raw_func.cyclomatic.saturating_sub(norm_func.cyclomatic);

            if diff > 0 {
                breakdown.push(ComplexityComponent {
                    source_type: ComplexitySourceType::FormattingArtifact {
                        artifact_type: FormattingArtifact::MultilineExpression,
                        severity: ArtifactSeverity::Medium,
                    },
                    contribution: diff,
                    location: CodeLocation {
                        file: raw_func.file.to_string_lossy().to_string(),
                        line: raw_func.line as u32,
                        column: 0,
                        span: None,
                    },
                    description: format!("Formatting in function: {}", raw_func.name),
                    suggestions: vec![
                        "Use consistent formatting".to_string(),
                        "Consider automated formatting tools".to_string(),
                    ],
                });
            }
        }

        AttributedComplexity {
            total: artifact_total,
            breakdown,
            confidence: 0.75, // Medium-high confidence for formatting artifacts
        }
    }

    /// Produces source mappings for every function in `functions`.
    ///
    /// For each function the output contains, in order:
    /// 1. a function-level mapping (`complexity_point` 1) spanning
    ///    `line ..= line + length`, and
    /// 2. one mapping per estimated complexity location after the first,
    ///    numbered from 2 upward. The first estimate is dropped because it
    ///    describes the same point as the function-level mapping.
    ///
    /// The per-point locations are estimates; in a full implementation they
    /// would come from AST analysis.
    fn generate_source_mappings(&self, functions: &[FunctionMetrics]) -> Vec<SourceMapping> {
        let mut mappings = Vec::new();

        for func in functions {
            let file = func.file.to_string_lossy().into_owned();
            let first_line = func.line as u32;
            let end_line = (func.line + func.length) as u32;

            // Function-level mapping for the function definition itself.
            mappings.push(SourceMapping {
                complexity_point: 1,
                location: CodeLocation {
                    file: file.clone(),
                    line: first_line,
                    column: 0,
                    span: Some((first_line, end_line)),
                },
                ast_path: vec![
                    "module".to_string(),
                    "function".to_string(),
                    func.name.clone(),
                ],
                context: format!("Function definition: {}", func.name),
            });

            // Remaining estimated points; index 0 is already covered above.
            let estimates = self
                .estimate_complexity_locations(func)
                .into_iter()
                .enumerate()
                .skip(1);

            mappings.extend(estimates.map(|(index, estimate)| SourceMapping {
                complexity_point: (index + 1) as u32,
                location: CodeLocation {
                    file: file.clone(),
                    line: estimate.line,
                    column: estimate.column,
                    span: estimate.span,
                },
                ast_path: vec![
                    "module".to_string(),
                    "function".to_string(),
                    func.name.clone(),
                    estimate.construct_type,
                ],
                context: estimate.context,
            }));
        }

        mappings
    }

    /// Estimates where a function's complexity points are located.
    ///
    /// In a full implementation, this would parse the AST to find actual
    /// control flow constructs. Here one location is produced per unit of
    /// cyclomatic complexity:
    ///
    /// * the first sits on the function's own line at column 0 and is
    ///   labelled `function_signature`;
    /// * the rest are labelled `control_flow_<i>`, use column 4 as an
    ///   indentation guess, and are spaced `length / cyclomatic` lines apart
    ///   (one line apart when the function has at most one line or one
    ///   complexity point).
    ///
    /// Estimated lines never exceed `line + length`, the span end recorded
    /// for the function by `generate_source_mappings`, so a short function
    /// with many branches does not produce locations outside its own span.
    ///
    /// Returns an empty vector when `func.cyclomatic` is 0.
    fn estimate_complexity_locations(
        &self,
        func: &FunctionMetrics,
    ) -> Vec<EstimatedComplexityLocation> {
        // Spread the points evenly over the body when there is room to do so.
        // The branch condition guarantees a non-zero divisor.
        let line_step = if func.cyclomatic > 1 && func.length > 1 {
            func.length / func.cyclomatic as usize
        } else {
            1
        };

        // Last line an estimate may point at.
        let span_end = func.line.saturating_add(func.length);

        (0..func.cyclomatic)
            .map(|i| {
                let offset = line_step.saturating_mul(i as usize);
                let line = func.line.saturating_add(offset).min(span_end) as u32;
                let is_signature = i == 0;

                EstimatedComplexityLocation {
                    line,
                    column: if is_signature { 0 } else { 4 }, // Estimate indentation
                    span: Some((line, line)),
                    construct_type: if is_signature {
                        "function_signature".to_string()
                    } else {
                        format!("control_flow_{}", i)
                    },
                    context: if is_signature {
                        format!("Function signature for {}", func.name)
                    } else {
                        format!("Control flow construct #{} in {}", i, func.name)
                    },
                }
            })
            .collect()
    }
}

impl Default for AttributionEngine {
    fn default() -> Self {
        Self::new()
    }
}

/// Complete complexity attribution analysis.
///
/// Breaks down total complexity into distinct categories: logical structure,
/// formatting artifacts, and recognized patterns. Includes source mappings
/// that tie complexity points back to code locations.
///
/// This is the value returned by `AttributionEngine::attribute`.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ComplexityAttribution {
    /// Complexity from true logical control flow and structure.
    ///
    /// The engine computes this from the normalized analysis result.
    pub logical_complexity: AttributedComplexity,
    /// Complexity from formatting choices that inflate raw metrics.
    ///
    /// The engine computes this from the difference between the raw and the
    /// normalized analysis results.
    pub formatting_artifacts: AttributedComplexity,
    /// Complexity from recognized patterns with adjusted scores.
    ///
    /// The engine obtains this from its pattern tracker, run over the
    /// normalized functions.
    pub pattern_complexity: AttributedComplexity,
    /// Mappings from complexity points back to source code locations.
    ///
    /// The engine generates these from the raw result's functions.
    pub source_mappings: Vec<SourceMapping>,
}

/// Attributed complexity with breakdown.
///
/// Represents a category of complexity (logical, formatting, or pattern-based)
/// with detailed breakdown of individual components and confidence level.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct AttributedComplexity {
    /// Total complexity score for this category.
    ///
    /// This is not guaranteed to equal the sum of `breakdown` contributions:
    /// for formatting artifacts the engine derives the total from the overall
    /// result totals, while the breakdown is computed per function.
    pub total: u32,
    /// Individual components contributing to the total. May be empty.
    pub breakdown: Vec<ComplexityComponent>,
    /// Confidence level in the attribution (0.0 to 1.0).
    ///
    /// The engine in this module reports fixed values: 0.9 for logical
    /// complexity and 0.75 for formatting artifacts.
    pub confidence: f32,
}

/// Individual complexity component with source attribution.
///
/// Represents a single contributor to complexity, tracking its source type,
/// contribution amount, code location, and any improvement suggestions.
///
/// The engine in this module emits one component per function for logical
/// complexity, and one per function whose raw complexity exceeds its
/// normalized complexity for formatting artifacts.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct ComplexityComponent {
    /// The type of complexity source (logical structure, formatting, or pattern).
    pub source_type: ComplexitySourceType,
    /// Numeric contribution to the total complexity score.
    pub contribution: u32,
    /// Source code location where this complexity originates.
    pub location: CodeLocation,
    /// Human-readable description of the complexity source.
    pub description: String,
    /// Suggested improvements to reduce this complexity.
    ///
    /// May be empty when there is nothing to suggest.
    pub suggestions: Vec<String>,
}

/// Mapping from a complexity point back to source code.
///
/// Provides traceability from computed complexity metrics to their
/// originating source code constructs via AST path.
///
/// Note that the mappings produced by `AttributionEngine` in this module are
/// estimates derived from function metrics rather than from AST analysis.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct SourceMapping {
    /// The complexity point index being mapped.
    ///
    /// The engine numbers points per function, using 1 for the function-level
    /// mapping and 2 and upward for the estimated points inside it.
    pub complexity_point: u32,
    /// Source code location for this complexity point.
    pub location: CodeLocation,
    /// Path through the AST to reach this construct (e.g., `["module", "function", "if"]`).
    ///
    /// The engine emits `["module", "function", <function name>]`, optionally
    /// followed by a construct label.
    pub ast_path: Vec<String>,
    /// Human-readable context describing what this mapping represents.
    pub context: String,
}

/// Source code location information.
///
/// Identifies a specific position in a source file, optionally with a span
/// for multi-line constructs.
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct CodeLocation {
    /// Path to the source file.
    ///
    /// The engine fills this with a lossy UTF-8 rendering of the function's
    /// file path.
    pub file: String,
    /// Line number (1-indexed).
    pub line: u32,
    /// Column number (0-indexed).
    ///
    /// The engine uses 0 for function-level locations.
    pub column: u32,
    /// Optional span as (start_line, end_line) for multi-line constructs.
    ///
    /// `None` when no span is known; the engine leaves it unset on breakdown
    /// components and sets it on source mappings.
    pub span: Option<(u32, u32)>,
}

/// Types of logical constructs that contribute to complexity.
///
/// These are control flow and structural elements that represent
/// genuine logical complexity in the code.
///
/// The attribution engine in this module currently only emits
/// `LogicalConstruct::Function`; the other variants are not constructed here.
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
pub enum LogicalConstruct {
    /// Function or method definition.
    Function,
    /// Conditional branch (if/else).
    If,
    /// Iteration construct (for, while, loop).
    Loop,
    /// Pattern matching expression.
    Match,
    /// Error handling block (try/catch in other languages, `?` in Rust).
    Try,
    /// Closure or lambda expression.
    Closure,
}

/// Types of formatting artifacts that inflate raw complexity metrics.
///
/// These are stylistic choices that don't represent actual logical
/// complexity but may affect raw line-based metrics.
///
/// The attribution engine in this module labels every formatting component
/// as `FormattingArtifact::MultilineExpression`; the other variants are not
/// constructed here.
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
pub enum FormattingArtifact {
    /// Expression split across multiple lines.
    MultilineExpression,
    /// Unnecessary blank lines or spacing.
    ExcessiveWhitespace,
    /// Mixed or inconsistent indentation style.
    InconsistentIndentation,
    /// Redundant parentheses around expressions.
    UnnecessaryParentheses,
    /// Unusual line break placement.
    LineBreakPattern,
}

/// Severity level of formatting artifacts.
///
/// Indicates how much the artifact inflates complexity metrics. Variants are
/// listed from least to most impact. The type derives `PartialEq` only, so
/// severities can be tested for equality but not ordered with `<` or `>`.
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
pub enum ArtifactSeverity {
    /// Minor impact on metrics (1-2 points).
    Low,
    /// Moderate impact on metrics (3-5 points).
    Medium,
    /// Significant impact on metrics (6+ points).
    High,
}

/// Recognized code patterns that have adjusted complexity scoring.
///
/// When these patterns are detected, complexity scores may be adjusted
/// since the pattern is well-understood and familiar to developers.
///
/// Unlike the other enums in this module, this one also derives `Eq` and
/// `Hash`, so it can be used as a key in hashed collections. It is not
/// constructed in this file; presumably `pattern_tracker` is its consumer
/// (TODO confirm).
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq, Hash)]
pub enum RecognizedPattern {
    /// Result/Option handling chains.
    ErrorHandling,
    /// Input validation and sanitization.
    Validation,
    /// Data mapping and transformation pipelines.
    DataTransformation,
    /// Mutable state management.
    StateManagement,
    /// Iterator and collection operations.
    Iterator,
    /// Builder pattern for object construction.
    Builder,
    /// Factory pattern for object creation.
    Factory,
    /// Observer/listener pattern for event handling.
    Observer,
}

/// Language-specific features that affect complexity analysis.
///
/// These features require special handling during analysis since
/// they have different complexity characteristics per language.
///
/// This enum is only declared here; nothing else in this file constructs or
/// matches on it.
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq)]
pub enum LanguageFeature {
    /// Async/await syntax for asynchronous code.
    AsyncAwait,
    /// Pattern matching (Rust `match`, Python `match`).
    PatternMatching,
    /// Generic type parameters and constraints.
    Generics,
    /// Macro invocations (Rust macros, C preprocessor).
    Macros,
    /// Decorators/attributes (Python decorators, Rust attributes).
    Decorators,
    /// List/dict comprehensions (Python).
    Comprehensions,
}

#[cfg(test)]
mod tests {
    use super::*;

    /// A freshly built engine must carry at least one source tracker.
    #[test]
    fn test_attribution_engine_new() {
        let AttributionEngine {
            source_trackers, ..
        } = AttributionEngine::new();

        assert!(!source_trackers.is_empty());
    }

    /// Field values of `AttributedComplexity` are stored as given.
    #[test]
    fn test_attributed_complexity() {
        let attributed = AttributedComplexity {
            total: 10,
            breakdown: Vec::new(),
            confidence: 0.8,
        };

        assert_eq!(attributed.total, 10);
        assert_eq!(attributed.confidence, 0.8);
    }

    /// Field values of `CodeLocation` are stored as given.
    #[test]
    fn test_code_location() {
        let CodeLocation {
            file, line, span, ..
        } = CodeLocation {
            file: "test.rs".to_string(),
            line: 42,
            column: 5,
            span: Some((42, 50)),
        };

        assert_eq!(file, "test.rs");
        assert_eq!(line, 42);
        assert_eq!(span, Some((42, 50)));
    }

    /// Field values of `SourceMapping` are stored as given.
    #[test]
    fn test_source_mapping() {
        let location = CodeLocation {
            file: "main.rs".to_string(),
            line: 10,
            column: 0,
            span: None,
        };
        let ast_path = vec!["module".to_string(), "function".to_string()];

        let source_mapping = SourceMapping {
            complexity_point: 3,
            location,
            ast_path,
            context: "Test context".to_string(),
        };

        assert_eq!(source_mapping.complexity_point, 3);
        assert_eq!(source_mapping.ast_path.len(), 2);
    }
}