pub mod imports;
pub mod resolver;
pub use imports::extract_imports;
pub use resolver::resolve_import;
use crate::scan::facts::ScanFacts;
use serde::{Deserialize, Serialize};
use std::collections::{BTreeMap, BTreeSet, HashMap, HashSet};
use std::path::{Path, PathBuf};
#[derive(Debug, Clone, Serialize, Deserialize, PartialEq, Eq)]
pub struct CouplingGraph {
pub edges: BTreeMap<PathBuf, BTreeSet<PathBuf>>,
pub nodes: BTreeSet<PathBuf>,
}
pub struct FileMetrics {
pub path: PathBuf,
pub fan_in: usize,
pub fan_out: usize,
pub instability: f32,
}
pub fn build_coupling_graph(facts: &ScanFacts, root: &Path) -> CouplingGraph {
let known_files: HashSet<PathBuf> = facts.files.iter().map(|f| f.path.clone()).collect();
let mut edges: BTreeMap<PathBuf, BTreeSet<PathBuf>> = BTreeMap::new();
for file in &facts.files {
let outgoing = edges.entry(file.path.clone()).or_default();
for raw in &file.imports {
if let Some(target) = resolve_import(raw, &file.path, root, &known_files) {
if target != file.path {
outgoing.insert(target);
}
}
}
}
let mut nodes: BTreeSet<PathBuf> = edges.keys().cloned().collect();
for targets in edges.values() {
nodes.extend(targets.iter().cloned());
}
CouplingGraph { edges, nodes }
}
pub fn compute_metrics(graph: &CouplingGraph) -> Vec<FileMetrics> {
let mut fan_out: HashMap<&PathBuf, usize> = HashMap::new();
let mut fan_in: HashMap<&PathBuf, usize> = HashMap::new();
for (from, targets) in &graph.edges {
fan_out.insert(from, targets.len());
for target in targets {
*fan_in.entry(target).or_insert(0) += 1;
}
}
graph
.nodes
.iter()
.map(|path| {
let fo = fan_out.get(path).copied().unwrap_or(0);
let fi = fan_in.get(path).copied().unwrap_or(0);
let instability = if fo + fi == 0 {
0.0_f32
} else {
fo as f32 / (fi + fo) as f32
};
FileMetrics {
path: path.clone(),
fan_in: fi,
fan_out: fo,
instability,
}
})
.collect()
}
const MAX_DFS_DEPTH: usize = 512;
pub fn detect_cycles(graph: &CouplingGraph) -> Vec<Vec<PathBuf>> {
let nodes: Vec<&PathBuf> = graph.nodes.iter().collect();
let n = nodes.len();
let index: HashMap<&PathBuf, usize> = nodes.iter().enumerate().map(|(i, p)| (*p, i)).collect();
let adj: Vec<Vec<usize>> = nodes
.iter()
.map(|node| {
graph
.edges
.get(*node)
.map(|targets| {
targets
.iter()
.filter_map(|t| index.get(t).copied())
.collect()
})
.unwrap_or_default()
})
.collect();
let mut state = vec![0u8; n];
let mut stack: Vec<usize> = Vec::new();
let mut cycles: Vec<Vec<PathBuf>> = Vec::new();
for start in 0..n {
if state[start] == 0 {
dfs(start, &adj, &mut state, &mut stack, &mut cycles, &nodes, 0);
}
}
for cycle in &mut cycles {
if let Some(min_pos) = cycle
.iter()
.enumerate()
.min_by(|a, b| a.1.cmp(b.1))
.map(|(i, _)| i)
{
cycle.rotate_left(min_pos);
}
}
cycles.sort();
cycles.dedup();
cycles
}
fn dfs(
node: usize,
adj: &[Vec<usize>],
state: &mut Vec<u8>,
stack: &mut Vec<usize>,
cycles: &mut Vec<Vec<PathBuf>>,
nodes: &[&PathBuf],
depth: usize,
) {
if depth > MAX_DFS_DEPTH {
state[node] = 2;
return;
}
state[node] = 1;
stack.push(node);
for &neighbor in &adj[node] {
match state[neighbor] {
1 => {
if let Some(pos) = stack.iter().position(|&n| n == neighbor) {
let cycle = stack[pos..].iter().map(|&i| nodes[i].clone()).collect();
cycles.push(cycle);
}
}
0 => dfs(neighbor, adj, state, stack, cycles, nodes, depth + 1),
_ => {}
}
}
stack.pop();
state[node] = 2;
}
#[cfg(test)]
mod tests {
use super::*;
fn graph_from_edges(edges: &[(&str, &str)]) -> CouplingGraph {
let mut edge_map: BTreeMap<PathBuf, BTreeSet<PathBuf>> = BTreeMap::new();
let mut nodes: BTreeSet<PathBuf> = BTreeSet::new();
for (src, dst) in edges {
let src = PathBuf::from(src);
let dst = PathBuf::from(dst);
nodes.insert(src.clone());
nodes.insert(dst.clone());
edge_map.entry(src).or_default().insert(dst);
}
CouplingGraph {
edges: edge_map,
nodes,
}
}
#[test]
fn detects_simple_two_node_cycle() {
let graph = graph_from_edges(&[("a.rs", "b.rs"), ("b.rs", "a.rs")]);
let cycles = detect_cycles(&graph);
assert_eq!(cycles.len(), 1);
assert_eq!(cycles[0].len(), 2);
}
#[test]
fn detects_three_node_cycle() {
let graph = graph_from_edges(&[("a.rs", "b.rs"), ("b.rs", "c.rs"), ("c.rs", "a.rs")]);
let cycles = detect_cycles(&graph);
assert_eq!(cycles.len(), 1);
assert_eq!(cycles[0].len(), 3);
}
#[test]
fn no_cycle_in_dag() {
let graph = graph_from_edges(&[("a.rs", "b.rs"), ("b.rs", "c.rs"), ("a.rs", "c.rs")]);
let cycles = detect_cycles(&graph);
assert!(cycles.is_empty());
}
#[test]
fn disconnected_graph_no_cycle() {
let graph = graph_from_edges(&[("a.rs", "b.rs"), ("c.rs", "d.rs")]);
let cycles = detect_cycles(&graph);
assert!(cycles.is_empty());
}
#[test]
fn compute_metrics_fan_in_and_fan_out() {
let graph = graph_from_edges(&[("a.rs", "b.rs"), ("a.rs", "c.rs"), ("b.rs", "c.rs")]);
let metrics = compute_metrics(&graph);
let find = |name: &str| -> Option<(usize, usize)> {
metrics
.iter()
.find(|m| m.path == std::path::Path::new(name))
.map(|m| (m.fan_in, m.fan_out))
};
let (a_in, a_out) = find("a.rs").expect("a.rs metrics should exist");
let (b_in, b_out) = find("b.rs").expect("b.rs metrics should exist");
let (c_in, c_out) = find("c.rs").expect("c.rs metrics should exist");
assert_eq!(a_out, 2);
assert_eq!(a_in, 0);
assert_eq!(b_out, 1);
assert_eq!(b_in, 1);
assert_eq!(c_out, 0);
assert_eq!(c_in, 2);
}
}