Skip to main content

swh_graph_stdlib/
fs.rs

1// Copyright (C) 2024-2026  The Software Heritage developers
2// See the AUTHORS file at the top-level directory of this distribution
3// License: GNU General Public License version 3, or any later version
4// See top-level LICENSE file for more information
5
//! Filesystem manipulation functions, i.e., directories and contents.
7
8use std::collections::HashMap;
9
10use anyhow::{Context, Result, ensure};
11use log::warn;
12
13use swh_graph::NodeType;
14use swh_graph::graph::*;
15use swh_graph::labels::{EdgeLabel, LabelNameId, Permission};
16use swh_graph::properties;
17
/// Builds the error message reported when an entry name has no associated
/// label name id.
///
/// `name` is rendered lossily as UTF-8, so invalid byte sequences show up as
/// the Unicode replacement character instead of causing a failure.
fn msg_no_label_name_id(name: impl AsRef<[u8]>) -> String {
    let entry = String::from_utf8_lossy(name.as_ref());
    format!("no label_name id found for entry \"{entry}\"")
}
24
25/// Given a graph and a directory node, return the node id of a named directory
26/// entry located (not recursively) in that directory, if it exists.
27///
28/// See [resolve_path] for a version of this function that traverses
29/// sub-directories recursively.
30///
31/// ```ignore
32/// if let Ok(Some(node)) == resolve_name(&graph, 42, "README.md") {
33///     // do something with node
34/// }
35/// ```
36pub fn resolve_name<G>(graph: &G, dir: NodeId, name: impl AsRef<[u8]>) -> Result<Option<NodeId>>
37where
38    G: SwhLabeledForwardGraph + SwhGraphWithProperties,
39    <G as SwhGraphWithProperties>::LabelNames: properties::LabelNames,
40    <G as SwhGraphWithProperties>::Maps: properties::Maps,
41{
42    let props = graph.properties();
43    let name_id = props
44        .label_name_id(name.as_ref())
45        .with_context(|| msg_no_label_name_id(name))?;
46    resolve_name_by_id(&graph, dir, name_id)
47}
48
49/// Same as [resolve_name], but using a pre-resolved [LabelNameId] as entry
50/// name. Using this function is more efficient in case the same name (e.g.,
51/// "README.md") is to be looked up in many directories.
52pub fn resolve_name_by_id<G>(graph: &G, dir: NodeId, name: LabelNameId) -> Result<Option<NodeId>>
53where
54    G: SwhLabeledForwardGraph + SwhGraphWithProperties,
55    <G as SwhGraphWithProperties>::Maps: properties::Maps,
56{
57    let node_type = graph.properties().node_type(dir);
58    ensure!(
59        node_type == NodeType::Directory,
60        "Type of {dir} should be dir, but is {node_type} instead"
61    );
62
63    for (succ, label) in graph.labeled_successors(dir).flatten_labels() {
64        #[allow(clippy::collapsible_if)]
65        if let EdgeLabel::DirEntry(dentry) = label {
66            if dentry.label_name_id() == name {
67                return Ok(Some(succ));
68            }
69        }
70    }
71    Ok(None)
72}
73
74/// Given a graph and a directory node, return the node id of a directory entry
75/// located at a given path within that directory, if it exists.
76///
77/// Slashes (`/`) contained in `path` are interpreted as path separators.
78///
79/// See [resolve_name] for a non-recursive version of this function.
80///
81/// ```ignore
82/// if let Ok(Some(node)) == resolve_path(&graph, 42, "src/main.c") {
83///     // do something with node
84/// }
85/// ```
86pub fn resolve_path<G>(graph: &G, dir: NodeId, path: impl AsRef<[u8]>) -> Result<Option<NodeId>>
87where
88    G: SwhLabeledForwardGraph + SwhGraphWithProperties,
89    <G as SwhGraphWithProperties>::LabelNames: properties::LabelNames,
90    <G as SwhGraphWithProperties>::Maps: properties::Maps,
91{
92    let props = graph.properties();
93    let path = path
94        .as_ref()
95        .split(|byte| *byte == b'/')
96        .map(|name| {
97            props
98                .label_name_id(name)
99                .with_context(|| msg_no_label_name_id(name))
100        })
101        .collect::<Result<Vec<LabelNameId>, _>>()?;
102    resolve_path_by_id(&graph, dir, &path)
103}
104
105/// Same as [resolve_path], but using as path a sequence of pre-resolved
106/// [LabelNameId]-s. Using this function is more efficient in case the same path
107/// (e.g., "src/main.c") is to be looked up in many directories.
108pub fn resolve_path_by_id<G>(graph: &G, dir: NodeId, path: &[LabelNameId]) -> Result<Option<NodeId>>
109where
110    G: SwhLabeledForwardGraph + SwhGraphWithProperties,
111    <G as SwhGraphWithProperties>::Maps: properties::Maps,
112{
113    let mut cur_entry = dir;
114    for name in path {
115        match resolve_name_by_id(graph, cur_entry, *name)? {
116            None => return Ok(None),
117            Some(entry) => cur_entry = entry,
118        }
119    }
120    Ok(Some(cur_entry))
121}
122
/// Recursive representation of a directory tree, ignoring sharing.
///
/// Note that a `Revision` variant can in fact point to either revision or
/// release nodes.
#[derive(Debug, Default, PartialEq)]
pub enum FsTree {
    /// A content node; carries no payload. This is the default variant.
    #[default]
    Content,
    /// A directory, mapping each entry name (as raw bytes) to the subtree that
    /// entry designates and the permission of the entry, if any.
    Directory(HashMap<Vec<u8>, (FsTree, Option<Permission>)>),
    /// A revision or release node, identified by its node id; it is not
    /// expanded any further.
    Revision(NodeId),
}
134
135/// Given a graph and a directory node in it (usually, but not necessarily, the
136/// *root* directory of a repository), return a recursive list of the contained
137/// files and directories.
138///
139/// Note that symlinks are not followed during listing and are reported as
140/// files in the returned tree. To recognize them as links, check the
141/// permissions of the associated directory entries.
142pub fn ls_tree<G>(graph: &G, dir: NodeId) -> Result<FsTree>
143where
144    G: SwhLabeledForwardGraph + SwhGraphWithProperties,
145    <G as SwhGraphWithProperties>::LabelNames: properties::LabelNames,
146    <G as SwhGraphWithProperties>::Maps: properties::Maps,
147{
148    let props = graph.properties();
149    let node_type = props.node_type(dir);
150    ensure!(
151        node_type == NodeType::Directory,
152        "Type of {dir} should be dir, but is {node_type} instead"
153    );
154
155    let mut dir_entries = HashMap::new();
156    for (succ, labels) in graph.labeled_successors(dir) {
157        let node_type = props.node_type(succ);
158        for label in labels {
159            if let EdgeLabel::DirEntry(dentry) = label {
160                let file_name = props.label_name(dentry.label_name_id());
161                let perm = dentry.permission();
162                match node_type {
163                    NodeType::Content => {
164                        dir_entries.insert(file_name, (FsTree::Content, perm));
165                    }
166                    NodeType::Directory => {
167                        // recurse into subdir
168                        if let Ok(subdir) = ls_tree(graph, succ) {
169                            dir_entries.insert(file_name, (subdir, perm));
170                        } else {
171                            warn!("Cannot list (sub-)directory {succ}, skipping it");
172                        }
173                    }
174                    NodeType::Revision | NodeType::Release => {
175                        dir_entries.insert(file_name, (FsTree::Revision(succ), perm));
176                    }
177                    NodeType::Origin | NodeType::Snapshot => {
178                        warn!("Ignoring dir entry with unexpected type {node_type}");
179                    }
180                }
181            }
182        }
183    }
184
185    Ok(FsTree::Directory(dir_entries))
186}