Skip to main content

sloc_core/
delta.rs

1// SPDX-License-Identifier: AGPL-3.0-or-later
2// Copyright (C) 2026 Nima Shafie <nimzshafie@gmail.com>
3
4use std::collections::{BTreeSet, HashMap, HashSet};
5
6use chrono::{DateTime, Utc};
7use serde::Serialize;
8
9use crate::{AnalysisRun, EffectiveCounts, FileRecord};
10
11#[derive(Debug, Serialize)]
12pub struct SummaryDelta {
13    pub baseline_run_id: String,
14    pub current_run_id: String,
15    pub baseline_timestamp: DateTime<Utc>,
16    pub current_timestamp: DateTime<Utc>,
17    pub baseline_files: u64,
18    pub current_files: u64,
19    pub files_analyzed_delta: i64,
20    pub baseline_code: u64,
21    pub current_code: u64,
22    pub code_lines_delta: i64,
23    pub baseline_comments: u64,
24    pub current_comments: u64,
25    pub comment_lines_delta: i64,
26    pub blank_lines_delta: i64,
27    pub total_lines_delta: i64,
28    /// Lines hit delta (positive = more covered). `None` if neither run has coverage data.
29    #[serde(skip_serializing_if = "Option::is_none")]
30    pub coverage_lines_hit_delta: Option<i64>,
31    /// Line coverage percentage delta (positive = improved). `None` if neither run has coverage.
32    #[serde(skip_serializing_if = "Option::is_none")]
33    pub coverage_line_pct_delta: Option<f64>,
34    /// Baseline line coverage percentage. `None` if baseline had no coverage data.
35    #[serde(skip_serializing_if = "Option::is_none")]
36    pub baseline_coverage_line_pct: Option<f64>,
37    /// Current line coverage percentage. `None` if current has no coverage data.
38    #[serde(skip_serializing_if = "Option::is_none")]
39    pub current_coverage_line_pct: Option<f64>,
40}
41
42#[derive(Debug, Serialize, PartialEq, Eq, Clone, Copy)]
43#[serde(rename_all = "snake_case")]
44pub enum FileChangeStatus {
45    Added,
46    Removed,
47    Modified,
48    Unchanged,
49}
50
51#[derive(Debug, Serialize)]
52pub struct FileDelta {
53    pub relative_path: String,
54    pub language: Option<String>,
55    pub status: FileChangeStatus,
56    pub baseline_code: i64,
57    pub current_code: i64,
58    pub code_delta: i64,
59    pub baseline_comment: i64,
60    pub current_comment: i64,
61    pub comment_delta: i64,
62    pub baseline_blank: i64,
63    pub current_blank: i64,
64    pub blank_delta: i64,
65    pub total_delta: i64,
66}
67
68#[derive(Debug, Serialize)]
69pub struct ScanComparison {
70    pub summary: SummaryDelta,
71    pub file_deltas: Vec<FileDelta>,
72    pub files_added: usize,
73    pub files_removed: usize,
74    pub files_modified: usize,
75    pub files_unchanged: usize,
76}
77
78fn build_modified(record: &FileRecord, base: &EffectiveCounts, lang: Option<String>) -> FileDelta {
79    let curr = &record.effective_counts;
80    let code_delta = curr.code_lines.cast_signed() - base.code_lines.cast_signed();
81    let comment_delta = curr.comment_lines.cast_signed() - base.comment_lines.cast_signed();
82    let blank_delta = curr.blank_lines.cast_signed() - base.blank_lines.cast_signed();
83    let status = if code_delta == 0 && comment_delta == 0 && blank_delta == 0 {
84        FileChangeStatus::Unchanged
85    } else {
86        FileChangeStatus::Modified
87    };
88    FileDelta {
89        relative_path: record.relative_path.clone(),
90        language: lang,
91        status,
92        baseline_code: base.code_lines.cast_signed(),
93        current_code: curr.code_lines.cast_signed(),
94        code_delta,
95        baseline_comment: base.comment_lines.cast_signed(),
96        current_comment: curr.comment_lines.cast_signed(),
97        comment_delta,
98        baseline_blank: base.blank_lines.cast_signed(),
99        current_blank: curr.blank_lines.cast_signed(),
100        blank_delta,
101        total_delta: code_delta + comment_delta + blank_delta,
102    }
103}
104
105fn build_added(record: &FileRecord, lang: Option<String>) -> FileDelta {
106    let curr = &record.effective_counts;
107    let total = (curr.code_lines + curr.comment_lines + curr.blank_lines).cast_signed();
108    FileDelta {
109        relative_path: record.relative_path.clone(),
110        language: lang,
111        status: FileChangeStatus::Added,
112        baseline_code: 0,
113        current_code: curr.code_lines.cast_signed(),
114        code_delta: curr.code_lines.cast_signed(),
115        baseline_comment: 0,
116        current_comment: curr.comment_lines.cast_signed(),
117        comment_delta: curr.comment_lines.cast_signed(),
118        baseline_blank: 0,
119        current_blank: curr.blank_lines.cast_signed(),
120        blank_delta: curr.blank_lines.cast_signed(),
121        total_delta: total,
122    }
123}
124
125fn build_removed(path: &str, base: &EffectiveCounts, lang: Option<String>) -> FileDelta {
126    let total = (base.code_lines + base.comment_lines + base.blank_lines).cast_signed();
127    FileDelta {
128        relative_path: path.to_string(),
129        language: lang,
130        status: FileChangeStatus::Removed,
131        baseline_code: base.code_lines.cast_signed(),
132        current_code: 0,
133        code_delta: -(base.code_lines.cast_signed()),
134        baseline_comment: base.comment_lines.cast_signed(),
135        current_comment: 0,
136        comment_delta: -(base.comment_lines.cast_signed()),
137        baseline_blank: base.blank_lines.cast_signed(),
138        current_blank: 0,
139        blank_delta: -(base.blank_lines.cast_signed()),
140        total_delta: -total,
141    }
142}
143
144#[allow(clippy::cast_precision_loss)]
145fn coverage_line_pct(hit: u64, found: u64) -> Option<f64> {
146    if found == 0 {
147        None
148    } else {
149        let pct = (hit as f64 / found as f64) * 100.0;
150        Some((pct * 10.0).round() / 10.0)
151    }
152}
153
154#[must_use]
155#[allow(clippy::too_many_lines)]
156pub fn compute_delta(baseline: &AnalysisRun, current: &AnalysisRun) -> ScanComparison {
157    let baseline_map: HashMap<&str, &EffectiveCounts> = baseline
158        .per_file_records
159        .iter()
160        .map(|f| (f.relative_path.as_str(), &f.effective_counts))
161        .collect();
162
163    let current_paths: HashSet<&str> = current
164        .per_file_records
165        .iter()
166        .map(|f| f.relative_path.as_str())
167        .collect();
168
169    let mut file_deltas: Vec<FileDelta> = Vec::new();
170
171    for record in &current.per_file_records {
172        let path = record.relative_path.as_str();
173        let lang = record.language.map(|l| l.display_name().to_string());
174        if let Some(base) = baseline_map.get(path) {
175            file_deltas.push(build_modified(record, base, lang));
176        } else {
177            file_deltas.push(build_added(record, lang));
178        }
179    }
180
181    for record in &baseline.per_file_records {
182        if !current_paths.contains(record.relative_path.as_str()) {
183            let lang = record.language.map(|l| l.display_name().to_string());
184            file_deltas.push(build_removed(
185                &record.relative_path,
186                &record.effective_counts,
187                lang,
188            ));
189        }
190    }
191
192    file_deltas.sort_by(|a, b| {
193        const fn order(s: FileChangeStatus) -> u8 {
194            match s {
195                FileChangeStatus::Modified => 0,
196                FileChangeStatus::Added => 1,
197                FileChangeStatus::Removed => 2,
198                FileChangeStatus::Unchanged => 3,
199            }
200        }
201        order(a.status)
202            .cmp(&order(b.status))
203            .then(a.relative_path.cmp(&b.relative_path))
204    });
205
206    let files_added = file_deltas
207        .iter()
208        .filter(|f| f.status == FileChangeStatus::Added)
209        .count();
210    let files_removed = file_deltas
211        .iter()
212        .filter(|f| f.status == FileChangeStatus::Removed)
213        .count();
214    let files_modified = file_deltas
215        .iter()
216        .filter(|f| f.status == FileChangeStatus::Modified)
217        .count();
218    let files_unchanged = file_deltas
219        .iter()
220        .filter(|f| f.status == FileChangeStatus::Unchanged)
221        .count();
222
223    let s = &current.summary_totals;
224    let b = &baseline.summary_totals;
225
226    let baseline_cov_pct = coverage_line_pct(b.coverage_lines_hit, b.coverage_lines_found);
227    let current_cov_pct = coverage_line_pct(s.coverage_lines_hit, s.coverage_lines_found);
228    let coverage_lines_hit_delta = if b.coverage_lines_found > 0 || s.coverage_lines_found > 0 {
229        Some(s.coverage_lines_hit.cast_signed() - b.coverage_lines_hit.cast_signed())
230    } else {
231        None
232    };
233    let coverage_line_pct_delta = match (baseline_cov_pct, current_cov_pct) {
234        (Some(base_pct), Some(cur_pct)) => Some(((cur_pct - base_pct) * 10.0).round() / 10.0),
235        (None, Some(cur_pct)) => Some(cur_pct),
236        _ => None,
237    };
238
239    ScanComparison {
240        summary: SummaryDelta {
241            baseline_run_id: baseline.tool.run_id.clone(),
242            current_run_id: current.tool.run_id.clone(),
243            baseline_timestamp: baseline.tool.timestamp_utc,
244            current_timestamp: current.tool.timestamp_utc,
245            baseline_files: b.files_analyzed,
246            current_files: s.files_analyzed,
247            files_analyzed_delta: s.files_analyzed.cast_signed() - b.files_analyzed.cast_signed(),
248            baseline_code: b.code_lines,
249            current_code: s.code_lines,
250            code_lines_delta: s.code_lines.cast_signed() - b.code_lines.cast_signed(),
251            baseline_comments: b.comment_lines,
252            current_comments: s.comment_lines,
253            comment_lines_delta: s.comment_lines.cast_signed() - b.comment_lines.cast_signed(),
254            blank_lines_delta: s.blank_lines.cast_signed() - b.blank_lines.cast_signed(),
255            total_lines_delta: s
256                .total_physical_lines
257                .cast_signed()
258                .wrapping_sub(b.total_physical_lines.cast_signed()),
259            coverage_lines_hit_delta,
260            coverage_line_pct_delta,
261            baseline_coverage_line_pct: baseline_cov_pct,
262            current_coverage_line_pct: current_cov_pct,
263        },
264        file_deltas,
265        files_added,
266        files_removed,
267        files_modified,
268        files_unchanged,
269    }
270}
271
272// ── Multi-point comparison ─────────────────────────────────────────────────────
273
274/// Summary metrics snapshot for one scan in a multi-point timeline.
275#[derive(Debug, Serialize)]
276pub struct MultiScanPoint {
277    pub run_id: String,
278    pub timestamp: DateTime<Utc>,
279    pub git_commit: Option<String>,
280    pub git_branch: Option<String>,
281    pub git_tags: Option<String>,
282    pub git_nearest_tag: Option<String>,
283    pub code_lines: i64,
284    pub comment_lines: i64,
285    pub blank_lines: i64,
286    pub files_analyzed: i64,
287    pub test_count: i64,
288    pub coverage_line_pct: Option<f64>,
289}
290
291/// Per-file code counts across N scan points.
292#[derive(Debug, Serialize)]
293pub struct MultiFileDelta {
294    pub relative_path: String,
295    pub language: Option<String>,
296    /// Code lines at each scan (`None` = file absent at that point).
297    pub code_per_scan: Vec<Option<i64>>,
298    /// Delta from previous scan; index 0 is always `None`.
299    pub code_delta_per_scan: Vec<Option<i64>>,
300    /// `"added"` | `"removed"` | `"modified"` | `"unchanged"`
301    pub overall_status: String,
302    /// Code delta from first presence to last presence.
303    pub total_code_delta: i64,
304}
305
306#[derive(Debug, Serialize)]
307pub struct MultiScanComparison {
308    pub points: Vec<MultiScanPoint>,
309    /// One `ScanComparison` per consecutive pair (length = N − 1).
310    pub sequential_deltas: Vec<ScanComparison>,
311    /// Overall delta from the first scan to the last scan.
312    pub total_delta: SummaryDelta,
313    /// All files × all scan points, sorted modified → added → removed → unchanged.
314    pub file_matrix: Vec<MultiFileDelta>,
315}
316
317/// Per-scan deltas for a single file path: delta[0] is always None (no previous), delta[i] is
318/// code[i] - code[i-1], or None when both sides are absent.
319fn sequential_code_deltas(code_per_scan: &[Option<i64>]) -> Vec<Option<i64>> {
320    let mut deltas = vec![None];
321    for i in 1..code_per_scan.len() {
322        if code_per_scan[i - 1].is_some() || code_per_scan[i].is_some() {
323            let prev = code_per_scan[i - 1].unwrap_or(0);
324            let curr = code_per_scan[i].unwrap_or(0);
325            deltas.push(Some(curr - prev));
326        } else {
327            deltas.push(None);
328        }
329    }
330    deltas
331}
332
333/// Classify a file's lifetime across scans as "added", "removed", "modified", or "unchanged".
334fn classify_file_status(code_per_scan: &[Option<i64>]) -> &'static str {
335    let n = code_per_scan.len();
336    let first_idx = code_per_scan.iter().position(Option::is_some);
337    let last_idx = code_per_scan.iter().rposition(Option::is_some);
338    match (first_idx, last_idx) {
339        (Some(f), Some(l)) if f > 0 && l == n - 1 => "added",
340        (Some(f), Some(l)) if f == 0 && l < n - 1 => "removed",
341        (Some(f), Some(l)) => {
342            let first_val = code_per_scan[f].unwrap_or(0);
343            if code_per_scan[f..=l]
344                .iter()
345                .all(|v| v.is_none_or(|x| x == first_val))
346            {
347                "unchanged"
348            } else {
349                "modified"
350            }
351        }
352        _ => "unchanged",
353    }
354}
355
356/// Net code-line change from the first scan where the file appeared to the last.
357fn net_code_delta(code_per_scan: &[Option<i64>]) -> i64 {
358    let first_idx = code_per_scan.iter().position(Option::is_some);
359    let last_idx = code_per_scan.iter().rposition(Option::is_some);
360    match (first_idx, last_idx) {
361        (Some(f), Some(l)) => code_per_scan[l].unwrap_or(0) - code_per_scan[f].unwrap_or(0),
362        _ => 0,
363    }
364}
365
366/// Compute a multi-point timeline comparison.
367///
368/// `runs` must be sorted chronologically (oldest first) and contain at least 2 elements.
369///
370/// # Panics
371///
372/// Panics if `runs` contains fewer than 2 elements.
373#[must_use]
374#[allow(clippy::cast_precision_loss)]
375pub fn compute_multi_delta(runs: &[&AnalysisRun]) -> MultiScanComparison {
376    assert!(
377        runs.len() >= 2,
378        "compute_multi_delta requires at least 2 runs"
379    );
380
381    // Union of all file paths across every run.
382    let all_paths: BTreeSet<String> = runs
383        .iter()
384        .flat_map(|r| r.per_file_records.iter().map(|f| f.relative_path.clone()))
385        .collect();
386
387    // Per-run lookup: path → FileRecord.
388    let run_maps: Vec<HashMap<&str, &FileRecord>> = runs
389        .iter()
390        .map(|r| {
391            r.per_file_records
392                .iter()
393                .map(|f| (f.relative_path.as_str(), f))
394                .collect()
395        })
396        .collect();
397
398    // Build the file matrix.
399    let mut file_matrix: Vec<MultiFileDelta> = all_paths
400        .into_iter()
401        .map(|path| {
402            let code_per_scan: Vec<Option<i64>> = run_maps
403                .iter()
404                .map(|m| {
405                    m.get(path.as_str())
406                        .map(|r| r.effective_counts.code_lines.cast_signed())
407                })
408                .collect();
409            let code_delta_per_scan = sequential_code_deltas(&code_per_scan);
410            let overall_status = classify_file_status(&code_per_scan).to_string();
411            let total_code_delta = net_code_delta(&code_per_scan);
412            let language = run_maps.iter().find_map(|m| {
413                m.get(path.as_str())
414                    .and_then(|r| r.language)
415                    .map(|l| l.display_name().to_string())
416            });
417            MultiFileDelta {
418                relative_path: path,
419                language,
420                code_per_scan,
421                code_delta_per_scan,
422                overall_status,
423                total_code_delta,
424            }
425        })
426        .collect();
427
428    // Sort: modified → added → removed → unchanged, then path.
429    file_matrix.sort_by(|a, b| {
430        const fn status_order(s: &str) -> u8 {
431            match s.as_bytes() {
432                b"modified" => 0,
433                b"added" => 1,
434                b"removed" => 2,
435                _ => 3,
436            }
437        }
438        status_order(&a.overall_status)
439            .cmp(&status_order(&b.overall_status))
440            .then(a.relative_path.cmp(&b.relative_path))
441    });
442
443    // Sequential deltas (N - 1 pairs).
444    let sequential_deltas: Vec<ScanComparison> = (0..runs.len() - 1)
445        .map(|i| compute_delta(runs[i], runs[i + 1]))
446        .collect();
447
448    // Overall first-to-last delta.
449    let total_delta = compute_delta(runs[0], runs[runs.len() - 1]).summary;
450
451    // Build scan-point summaries.
452    let points: Vec<MultiScanPoint> = runs
453        .iter()
454        .map(|r| {
455            let s = &r.summary_totals;
456            let coverage_line_pct = if s.coverage_lines_found > 0 {
457                Some(
458                    ((s.coverage_lines_hit as f64 / s.coverage_lines_found as f64 * 1000.0)
459                        .round())
460                        / 10.0,
461                )
462            } else {
463                None
464            };
465            MultiScanPoint {
466                run_id: r.tool.run_id.clone(),
467                timestamp: r.tool.timestamp_utc,
468                git_commit: r.git_commit_short.clone(),
469                git_branch: r.git_branch.clone(),
470                git_tags: r.git_tags.clone(),
471                git_nearest_tag: r.git_nearest_tag.clone(),
472                code_lines: s.code_lines.cast_signed(),
473                comment_lines: s.comment_lines.cast_signed(),
474                blank_lines: s.blank_lines.cast_signed(),
475                files_analyzed: s.files_analyzed.cast_signed(),
476                test_count: s.test_count.cast_signed(),
477                coverage_line_pct,
478            }
479        })
480        .collect();
481
482    MultiScanComparison {
483        points,
484        sequential_deltas,
485        total_delta,
486        file_matrix,
487    }
488}