use std::fs;
use std::path::{Path, PathBuf};
use std::time::Instant;
/// Where the performance baseline measurement is persisted as JSON.
const BASELINE_PATH: &str = ".planning/phases/33-verification/PERFORMANCE_BASELINE.json";
/// Maximum tolerated slowdown relative to the stored baseline (5%).
const MAX_REGRESSION: f64 = 0.05;
/// Minimum speedup the parser pool must provide over per-file parsing (10%).
/// Was `_MIN_POOL_SPEEDUP`, which did not match the `MIN_POOL_SPEEDUP` uses in
/// `test_parser_pool_effectiveness` and failed to compile in release builds.
/// `allow(dead_code)` keeps debug builds (where the perf tests are compiled
/// out) warning-free.
#[allow(dead_code)]
const MIN_POOL_SPEEDUP: f64 = 1.10;
/// One persisted benchmark measurement, written to `BASELINE_PATH` as
/// pretty-printed JSON and read back on later runs for regression checks.
#[derive(Debug, serde::Serialize, serde::Deserialize)]
struct PerformanceBaseline {
    /// Benchmark identifier (e.g. "baseline_indexing_100_files").
    test_name: String,
    /// Number of generated source files the benchmark indexed.
    file_count: usize,
    /// Measured wall-clock duration of the indexing run, in milliseconds.
    duration_ms: u128,
    /// RFC 3339 UTC timestamp of when the baseline was recorded
    /// (see `save_baseline`, which fills it from `chrono::Utc::now()`).
    timestamp: String,
}
/// Generate `count` synthetic Rust source files in `dir`, each containing a
/// representative mix of items (functions, a struct with impls, a trait, a
/// const, a type alias, an async fn) so the indexer gets realistic work.
///
/// Returns the paths of the files created, in order. Panics on I/O failure,
/// which is acceptable for a test fixture.
///
/// Was `_create_rust_files`, which did not match the `create_rust_files`
/// call sites in the tests below and failed to compile in release builds.
/// `allow(dead_code)`: only referenced from `cfg(not(debug_assertions))`
/// tests, so debug builds would otherwise warn.
#[allow(dead_code)]
fn create_rust_files(dir: &Path, count: usize) -> Vec<PathBuf> {
    let mut files = Vec::with_capacity(count);
    for i in 0..count {
        let file_path = dir.join(format!("file_{}.rs", i));
        // NOTE: the raw string below is the generated file content; its
        // layout (column-0 lines) is intentional and must stay as-is.
        let content = format!(
            r#"//! Module {i}
/// Function {i} documentation
pub fn function_{i}() -> usize {{
{i}
}}
/// Struct {i} documentation
#[derive(Debug, Clone)]
pub struct Struct{i} {{
/// Field documentation
pub field: usize,
/// Optional field
pub optional: Option<String>,
}}
impl Struct{i} {{
/// Create a new instance
pub fn new() -> Self {{
Self {{
field: {i},
optional: None,
}}
}}
/// Calculate value
pub fn calculate(&self, x: usize) -> usize {{
self.field + x
}}
}}
/// Nested function {i}
pub fn nested_function_{i}(x: usize) -> usize {{
x + {i}
}}
/// Trait definition
pub trait Process{i} {{
fn process(&self) -> usize;
}}
impl Process{i} for Struct{i} {{
fn process(&self) -> usize {{
self.field
}}
}}
/// Constant
pub const CONSTANT_{i}: usize = {i};
/// Type alias
pub type Result{i} = std::result::Result<usize, String>;
/// Async function
pub async fn async_function_{i}() -> usize {{
{i}
}}
"#
        );
        fs::write(&file_path, content).unwrap();
        files.push(file_path);
    }
    files
}
/// Run `f` once, print how long it took, and hand back the closure's result
/// together with the elapsed wall-clock time in milliseconds.
pub fn measure_duration<F, R>(name: &str, f: F) -> (R, u128)
where
    F: FnOnce() -> R,
{
    let begun = Instant::now();
    let outcome = f();
    let elapsed_ms = begun.elapsed().as_millis();
    println!("[PERF] {} took {}ms", name, elapsed_ms);
    (outcome, elapsed_ms)
}
/// Persist one measurement as pretty-printed JSON at `BASELINE_PATH`,
/// creating parent directories as needed. Panics on I/O or serialization
/// failure (test-support code).
#[allow(dead_code)]
fn save_baseline(name: &str, file_count: usize, duration_ms: u128) {
    let path = Path::new(BASELINE_PATH);
    if let Some(dir) = path.parent() {
        fs::create_dir_all(dir).unwrap();
    }
    let record = PerformanceBaseline {
        test_name: name.to_string(),
        file_count,
        duration_ms,
        timestamp: chrono::Utc::now().to_rfc3339(),
    };
    fs::write(path, serde_json::to_string_pretty(&record).unwrap()).unwrap();
    println!("[PERF] Baseline saved to {}", BASELINE_PATH);
}
/// Read the stored baseline from `BASELINE_PATH`; `None` when the file is
/// missing, unreadable, or not valid JSON for `PerformanceBaseline`.
#[allow(dead_code)]
fn load_baseline() -> Option<PerformanceBaseline> {
    fs::read_to_string(BASELINE_PATH)
        .ok()
        .and_then(|json| serde_json::from_str(&json).ok())
}
/// Compare `current_ms` against the stored baseline.
///
/// Returns `Ok(())` when no baseline exists yet (caller is expected to
/// create one), when the run improved, or when the slowdown stays within
/// `MAX_REGRESSION`; otherwise returns the regression fraction as `Err`.
/// Prints a `[PERF]` report either way.
#[allow(dead_code)]
fn check_regression(current_ms: u128) -> Result<(), f64> {
    // Guard clause: nothing to compare against yet.
    let baseline = match load_baseline() {
        Some(b) => b,
        None => {
            println!("[PERF] No baseline found - creating baseline");
            return Ok(());
        }
    };
    let base_ms = baseline.duration_ms as f64;
    let regression = (current_ms as f64 - base_ms) / base_ms;
    println!("[PERF] {}", baseline.test_name);
    println!("[PERF] Current: {}ms", current_ms);
    println!("[PERF] Baseline: {}ms", baseline.duration_ms);
    println!("[PERF] Regression: {:.2}%", regression * 100.0);
    if regression < 0.0 {
        println!(
            "[PERF] PASS: Improvement detected (-{:.2}%)",
            -regression * 100.0
        );
        Ok(())
    } else if regression <= MAX_REGRESSION {
        println!(
            "[PERF] PASS: Regression {:.2}% is within threshold of {:.0}%",
            regression * 100.0,
            MAX_REGRESSION * 100.0
        );
        Ok(())
    } else {
        println!(
            "[PERF] FAIL: Regression {:.2}% exceeds threshold of {:.0}%",
            regression * 100.0,
            MAX_REGRESSION * 100.0
        );
        Err(regression)
    }
}
/// End-to-end indexing benchmark over 100 generated files; compares the
/// measured duration against the stored baseline and fails on a regression
/// beyond `MAX_REGRESSION`. Runs in release builds only.
///
/// Fix: the original saved the *regressed* duration as the new baseline
/// before panicking, which overwrote the reference measurement and made the
/// very next run pass — the baseline is now only written when none exists.
#[test]
#[cfg(not(debug_assertions))]
fn test_baseline_indexing_performance() {
    let temp_dir = tempfile::TempDir::new().unwrap();
    let db_path = temp_dir.path().join("test.db");
    let test_dir = temp_dir.path().join("src");
    fs::create_dir_all(&test_dir).unwrap();
    let files = create_rust_files(&test_dir, 100);
    println!(
        "[PERF] Testing baseline indexing performance with {} files",
        files.len()
    );
    let mut graph = CodeGraph::open(&db_path).unwrap();
    let (_indexed, duration_ms) = measure_duration("baseline_indexing_100_files", || {
        let filter = FileFilter::new(temp_dir.path(), &[], &[]).unwrap();
        magellan::graph::scan::scan_directory_with_filter(
            &mut graph,
            temp_dir.path(),
            &filter,
            None,
        )
        .unwrap()
        .indexed
    });
    if let Err(regression) = check_regression(duration_ms) {
        // Deliberately do NOT overwrite the baseline here: persisting the
        // regressed duration would mask the regression on the next run.
        panic!(
            "Performance regression detected: {:.2}% (threshold: {:.0}%)",
            regression * 100.0,
            MAX_REGRESSION * 100.0
        );
    }
    // First run on this machine: persist the measurement as the baseline.
    if load_baseline().is_none() {
        save_baseline("baseline_indexing_100_files", 100, duration_ms);
    }
}
/// Index the same 50 generated files twice — once through the pooled scan
/// path and once via a naive per-file delete/index loop — then report the
/// speedup. Prints a warning (does not fail) when the pool falls below
/// `MIN_POOL_SPEEDUP`. Runs in release builds only.
#[test]
#[cfg(not(debug_assertions))]
fn test_parser_pool_effectiveness() {
    let temp_dir = tempfile::TempDir::new().unwrap();
    let db_path_pool = temp_dir.path().join("pool.db");
    let db_path_nopool = temp_dir.path().join("nopool.db");
    let test_dir = temp_dir.path().join("src");
    fs::create_dir_all(&test_dir).unwrap();
    let files = create_rust_files(&test_dir, 50);
    println!(
        "[PERF] Testing parser pool effectiveness with {} files",
        files.len()
    );

    // Pooled path: one directory scan through the shared parser pool.
    let mut graph_pool = CodeGraph::open(&db_path_pool).unwrap();
    let (_indexed_pool, duration_pool) = measure_duration("indexing_with_parser_pool", || {
        let filter = FileFilter::new(temp_dir.path(), &[], &[]).unwrap();
        magellan::graph::scan::scan_directory_with_filter(
            &mut graph_pool,
            temp_dir.path(),
            &filter,
            None,
        )
        .unwrap()
        .indexed
    });

    // Baseline path: re-read and re-index every file individually.
    let mut graph_nopool = CodeGraph::open(&db_path_nopool).unwrap();
    let (_indexed_nopool, duration_nopool) =
        measure_duration("indexing_without_parser_pool", || {
            let mut count = 0;
            for path in &files {
                let bytes = fs::read(path).unwrap();
                let key = path.to_string_lossy().to_string();
                let _ = graph_nopool.delete_file(&key);
                let _ = graph_nopool.index_file(&key, &bytes);
                let _ = graph_nopool.index_references(&key, &bytes);
                count += 1;
            }
            count
        });

    let speedup = duration_nopool as f64 / duration_pool as f64;
    println!(
        "[PERF] Parser pool speedup: {:.2}x (with: {}ms, without: {}ms)",
        speedup, duration_pool, duration_nopool
    );
    if speedup < MIN_POOL_SPEEDUP {
        println!(
            "[PERF] WARNING: Parser pool speedup {:.2}x is below threshold {:.2}x",
            speedup, MIN_POOL_SPEEDUP
        );
    } else {
        println!(
            "[PERF] PASS: Parser pool provides {:.0}% speedup (threshold: {:.0}%)",
            (speedup - 1.0) * 100.0,
            (MIN_POOL_SPEEDUP - 1.0) * 100.0
        );
    }
}
/// Exercise the parallel scan path over 100 generated files, print its
/// duration, and assert every file was indexed. Runs in release builds only.
#[test]
#[cfg(not(debug_assertions))]
fn test_sequential_vs_parallel_indexing() {
    println!("[PERF] Testing sequential vs parallel indexing");
    let temp_dir = tempfile::TempDir::new().unwrap();
    let db_path = temp_dir.path().join("test.db");
    let src_dir = temp_dir.path().join("src");
    fs::create_dir_all(&src_dir).unwrap();
    let _files = create_rust_files(&src_dir, 100);
    let mut graph = CodeGraph::open(&db_path).unwrap();
    let (indexed, parallel_ms) = measure_duration("parallel_scan_100_files", || {
        let filter = FileFilter::new(temp_dir.path(), &[], &[]).unwrap();
        magellan::graph::scan::scan_directory_with_filter(
            &mut graph,
            temp_dir.path(),
            &filter,
            None,
        )
        .unwrap()
        .indexed
    });
    println!(
        "[PERF] Parallel scan: {}ms for {} files",
        parallel_ms, indexed
    );
    assert_eq!(indexed, 100, "Should index all 100 files");
}
/// Time a full scan over 100 generated files and fail the test when
/// `check_regression` reports a slowdown beyond `MAX_REGRESSION` relative
/// to the stored baseline. Runs in release builds only.
#[test]
#[cfg(not(debug_assertions))]
fn test_regression_check() {
    let temp_dir = tempfile::TempDir::new().unwrap();
    let db_path = temp_dir.path().join("test.db");
    let src_dir = temp_dir.path().join("src");
    fs::create_dir_all(&src_dir).unwrap();
    let _files = create_rust_files(&src_dir, 100);
    let mut graph = CodeGraph::open(&db_path).unwrap();
    let (_indexed, current_ms) = measure_duration("regression_check_100_files", || {
        let filter = FileFilter::new(temp_dir.path(), &[], &[]).unwrap();
        magellan::graph::scan::scan_directory_with_filter(
            &mut graph,
            temp_dir.path(),
            &filter,
            None,
        )
        .unwrap()
        .indexed
    });
    if let Err(regression) = check_regression(current_ms) {
        panic!(
            "Performance regression detected: {:.2}% exceeds threshold {:.0}%",
            regression * 100.0,
            MAX_REGRESSION * 100.0
        );
    }
}
#[cfg(test)]
mod additional_diagnostics {
    #[allow(unused_imports)]
    use super::*;

    /// Break the 50-file indexing cost into a standalone I/O pass and the
    /// full scan (I/O + parsing + DB writes), printing each phase's share
    /// of the combined time. Runs in release builds only.
    #[test]
    #[cfg(not(debug_assertions))]
    fn test_performance_breakdown() {
        let temp_dir = tempfile::TempDir::new().unwrap();
        let db_path = temp_dir.path().join("test.db");
        let test_dir = temp_dir.path().join("src");
        fs::create_dir_all(&test_dir).unwrap();
        let _files = create_rust_files(&test_dir, 50);
        println!("\n[PERF] Performance breakdown for 50 files:");

        // Phase 1: read every generated file once, timing pure I/O.
        let io_timer = Instant::now();
        let mut bytes_read = 0;
        for dirent in fs::read_dir(&test_dir).unwrap() {
            let dirent = dirent.unwrap();
            if dirent.path().is_file() {
                bytes_read += fs::read(dirent.path()).unwrap().len();
            }
        }
        let io_ms = io_timer.elapsed().as_millis();

        // Phase 2: full scan through the graph (I/O + parsing + DB).
        let mut graph = CodeGraph::open(&db_path).unwrap();
        let scan_timer = Instant::now();
        let filter = FileFilter::new(temp_dir.path(), &[], &[]).unwrap();
        let indexed = magellan::graph::scan::scan_directory_with_filter(
            &mut graph,
            temp_dir.path(),
            &filter,
            None,
        )
        .unwrap()
        .indexed;
        let scan_ms = scan_timer.elapsed().as_millis();

        let combined = io_ms + scan_ms;
        // Percentage share of the combined time; 0.0 guards the div-by-zero
        // case on machines fast enough to report 0ms for both phases.
        let share = |part: u128| {
            if combined > 0 {
                (part as f64 / combined as f64) * 100.0
            } else {
                0.0
            }
        };
        println!(
            "[PERF] Standalone File I/O: {}ms ({:.1}%)",
            io_ms,
            share(io_ms)
        );
        println!(
            "[PERF] Scan with I/O + Parsing + DB: {}ms ({:.1}%)",
            scan_ms,
            share(scan_ms)
        );
        println!("[PERF] Total breakdown: {}ms", combined);
        println!("[PERF] Files indexed: {}", indexed);
        println!("[PERF] Total bytes read: {}", bytes_read);
        if indexed > 0 {
            println!("[PERF] Avg per file: {:.2}ms", scan_ms as f64 / indexed as f64);
        }
    }
}