Skip to main content

gkit_core/
submodules.rs

1//! Submodule traversal + parallel evaluation with deterministic output order.
2//!
3//! Mirrors the zsh recursion (`gitCoreLib.sh` `isEverythingCheckedIn` →
4//! `git submodule foreach`): each repo's submodules are checked before the repo
5//! itself, so the emit order is **post-order DFS** (children first, superproject
6//! last), siblings in submodule-config order. Checks run in parallel for speed,
7//! but results are buffered into fixed slots so output never depends on which
8//! thread finishes first.
9
10use crate::checks::{self, RepoStatus};
11use crate::git::Git;
12use std::path::{Path, PathBuf};
13
14/// One evaluated repo (or submodule).
15pub struct Entry {
16    pub path: PathBuf,
17    pub status: RepoStatus,
18}
19
20/// Direct submodule paths (absolute) of `dir`, in `git submodule status` order.
21/// Uninitialized submodules (status `-`) are skipped — nothing to check.
22fn direct_submodules(git: &dyn Git, dir: &Path) -> Vec<PathBuf> {
23    git.run(dir, &["submodule", "status"])
24        .stdout
25        .lines()
26        .filter_map(|line| {
27            let status = line.chars().next()?;
28            if status == '-' {
29                return None; // uninitialized
30            }
31            // Drop the 1-char status column; remainder is "<sha> <path> (<describe>)".
32            let path = line[1..].split_whitespace().nth(1)?;
33            Some(dir.join(path))
34        })
35        .collect()
36}
37
38/// All repos to check rooted at `root`, in post-order (submodules before parent,
39/// `root` last).
40/// Public: repos rooted at `root` in post-order DFS (submodules before parent,
41/// `root` last). Reused by `stmb` to walk the same tree.
42pub fn repo_paths(git: &dyn Git, root: &Path) -> Vec<PathBuf> {
43    collect_repos(git, root)
44}
45
46/// Is `dir` inside a git work tree? (`git rev-parse --is-inside-work-tree`
47/// prints `true` and exits 0). False for a missing dir or a plain directory.
48fn is_work_tree(git: &dyn Git, dir: &Path) -> bool {
49    let r = git.run(dir, &["rev-parse", "--is-inside-work-tree"]);
50    r.success && r.trimmed() == "true"
51}
52
53fn collect_repos(git: &dyn Git, root: &Path) -> Vec<PathBuf> {
54    fn visit(git: &dyn Git, dir: &Path, order: &mut Vec<PathBuf>) {
55        for sub in direct_submodules(git, dir) {
56            visit(git, &sub, order);
57        }
58        order.push(dir.to_path_buf());
59    }
60    let mut order = Vec::new();
61    visit(git, root, &mut order);
62    order
63}
64
65/// Evaluate `root` and all (recursive) submodules. Checks run in parallel; the
66/// returned Vec is in the fixed post-order DFS order.
67///
68/// `base_override` (the CLI `--base-branch`) applies only to the root; each
69/// submodule resolves its own base (`gkit.baseBranch`, then remote
70/// `origin/main`/`origin/master`). Like the zsh, submodules are fetched before
71/// checking (when `fetch`), the root is not.
72pub fn evaluate_tree<G: Git + Sync>(
73    git: &G,
74    root: &Path,
75    base_override: Option<&str>,
76    fetch: bool,
77) -> Vec<Entry> {
78    // Guard the root: a non-repo (or missing) dir would otherwise pass every check
79    // vacuously. Only the root needs this — submodules come from a real repo's
80    // `git submodule status`, so they're already work trees.
81    if !is_work_tree(git, root) {
82        let reason = if root.exists() {
83            "not a git repository"
84        } else {
85            "no such directory"
86        };
87        return vec![Entry {
88            path: root.to_path_buf(),
89            status: RepoStatus::unusable(reason),
90        }];
91    }
92    let repos = collect_repos(git, root);
93    let last = repos.len().saturating_sub(1);
94    let mut slots: Vec<Option<RepoStatus>> = (0..repos.len()).map(|_| None).collect();
95
96    std::thread::scope(|scope| {
97        let mut handles = Vec::with_capacity(repos.len());
98        for (i, path) in repos.iter().enumerate() {
99            let is_root = i == last;
100            let ovr = if is_root { base_override } else { None };
101            let do_fetch = fetch && !is_root; // zsh fetches submodules, not the root
102            let path = path.clone();
103            let handle = scope.spawn(move || {
104                if do_fetch {
105                    let _ = git.run(&path, &["fetch", "--quiet"]);
106                    let _ = git.run(&path, &["remote", "prune", "origin"]);
107                }
108                let base = crate::config::resolve_base(git, &path, ovr);
109                let solo = crate::config::resolve_solo(git, &path);
110                checks::evaluate(git, &path, &base, solo)
111            });
112            handles.push((i, handle));
113        }
114        for (i, handle) in handles {
115            slots[i] = Some(handle.join().expect("gkit: a check thread panicked"));
116        }
117    });
118
119    repos
120        .into_iter()
121        .zip(slots)
122        .map(|(path, status)| Entry {
123            path,
124            status: status.expect("every slot filled"),
125        })
126        .collect()
127}
128
#[cfg(test)]
mod tests {
    use super::*;
    use crate::git::test_support::FakeGit;

    /// Render paths with `/` separators so expectations also hold on Windows,
    /// where `Path::join` yields `\`.
    fn slashed(paths: &[PathBuf]) -> Vec<String> {
        paths
            .iter()
            .map(|p| p.display().to_string().replace('\\', "/"))
            .collect()
    }

    #[test]
    fn collect_repos_is_post_order_dfs() {
        // Layout: /r holds submodules a and b; b holds submodule c.
        // Children must be listed ahead of their parents.
        let git = FakeGit::new()
            .ok_in("/r", "submodule status", " sha a (x)\n sha b (x)")
            .ok_in("/r/a", "submodule status", "")
            .ok_in("/r/b", "submodule status", " sha c (x)")
            .ok_in("/r/b/c", "submodule status", "");
        let order = collect_repos(&git, Path::new("/r"));
        assert_eq!(slashed(&order), vec!["/r/a", "/r/b/c", "/r/b", "/r"]);
    }

    #[test]
    fn non_repo_root_is_flagged_not_passed() {
        // When rev-parse fails the root is not a work tree: exactly ONE entry
        // must come back, and it must fail the gate rather than pass vacuously.
        let git = FakeGit::new().fail("rev-parse --is-inside-work-tree");
        let entries = evaluate_tree(&git, Path::new("/not/a/repo"), None, false);
        assert_eq!(entries.len(), 1);
        let only = &entries[0];
        assert!(!only.status.ok());
        assert!(only.status.problem.is_some());
    }

    #[test]
    fn skips_uninitialized_submodules() {
        let git = FakeGit::new().ok_in("/r", "submodule status", "-sha a (x)\n sha b (x)\n");
        let subs = direct_submodules(&git, Path::new("/r"));
        // 'a' carries the '-' (uninitialized) flag and must be dropped.
        assert_eq!(slashed(&subs), vec!["/r/b"]);
    }
}