Skip to main content

cargo_coupling/
workspace.rs

1//! Workspace analysis using cargo metadata
2//!
3//! This module uses `cargo metadata` to understand the project structure,
4//! including workspace members, dependencies, and module organization.
5
6use std::collections::{HashMap, HashSet};
7use std::path::{Path, PathBuf};
8
9use cargo_metadata::{Metadata, MetadataCommand, PackageId};
10use thiserror::Error;
11
12/// Errors that can occur during workspace analysis
13#[derive(Error, Debug)]
14pub enum WorkspaceError {
15    #[error("Failed to run cargo metadata: {0}")]
16    MetadataError(#[from] cargo_metadata::Error),
17
18    #[error("Package not found: {0}")]
19    PackageNotFound(String),
20
21    #[error("Invalid manifest path: {0}")]
22    InvalidManifest(String),
23}
24
25/// Information about a crate in the workspace
26#[derive(Debug, Clone)]
27pub struct CrateInfo {
28    /// Crate name
29    pub name: String,
30    /// Package ID for dependency resolution
31    pub id: PackageId,
32    /// Path to the crate's source directory
33    pub src_path: PathBuf,
34    /// Path to Cargo.toml
35    pub manifest_path: PathBuf,
36    /// Direct dependencies (crate names)
37    pub dependencies: Vec<String>,
38    /// Dev dependencies
39    pub dev_dependencies: Vec<String>,
40    /// Is this a workspace member?
41    pub is_workspace_member: bool,
42}
43
44/// Information about the entire workspace
45#[derive(Debug)]
46pub struct WorkspaceInfo {
47    /// Root directory of the workspace
48    pub root: PathBuf,
49    /// All crates in the workspace
50    pub crates: HashMap<String, CrateInfo>,
51    /// Workspace members (crate names)
52    pub members: Vec<String>,
53    /// Dependency graph: crate name -> dependencies
54    pub dependency_graph: HashMap<String, HashSet<String>>,
55    /// Reverse dependency graph: crate name -> dependents
56    pub reverse_deps: HashMap<String, HashSet<String>>,
57}
58
59impl WorkspaceInfo {
60    /// Analyze a workspace from a path
61    pub fn from_path(path: &Path) -> Result<Self, WorkspaceError> {
62        // Find Cargo.toml
63        let manifest_path = find_cargo_toml(path)?;
64
65        // Run cargo metadata
66        let metadata = MetadataCommand::new()
67            .manifest_path(&manifest_path)
68            .exec()?;
69
70        Self::from_metadata(metadata)
71    }
72
73    /// Create workspace info from cargo metadata
74    pub fn from_metadata(metadata: Metadata) -> Result<Self, WorkspaceError> {
75        let root = metadata.workspace_root.as_std_path().to_path_buf();
76
77        let mut crates = HashMap::new();
78        let mut members = Vec::new();
79        let mut dependency_graph: HashMap<String, HashSet<String>> = HashMap::new();
80        let mut reverse_deps: HashMap<String, HashSet<String>> = HashMap::new();
81
82        // Collect workspace members
83        let workspace_member_ids: HashSet<_> = metadata.workspace_members.iter().collect();
84
85        // Process all packages
86        for package in &metadata.packages {
87            let is_workspace_member = workspace_member_ids.contains(&package.id);
88
89            if is_workspace_member {
90                members.push(package.name.clone());
91            }
92
93            // Get source directory
94            let src_path = package
95                .manifest_path
96                .parent()
97                .map(|p| p.as_std_path().join("src"))
98                .unwrap_or_default();
99
100            // Collect dependencies
101            let mut deps = Vec::new();
102            let mut dev_deps = Vec::new();
103
104            for dep in &package.dependencies {
105                if dep.kind == cargo_metadata::DependencyKind::Development {
106                    dev_deps.push(dep.name.clone());
107                } else {
108                    deps.push(dep.name.clone());
109                }
110
111                // Build dependency graph
112                dependency_graph
113                    .entry(package.name.clone())
114                    .or_default()
115                    .insert(dep.name.clone());
116
117                // Build reverse dependency graph
118                reverse_deps
119                    .entry(dep.name.clone())
120                    .or_default()
121                    .insert(package.name.clone());
122            }
123
124            let crate_info = CrateInfo {
125                name: package.name.clone(),
126                id: package.id.clone(),
127                src_path,
128                manifest_path: package.manifest_path.as_std_path().to_path_buf(),
129                dependencies: deps,
130                dev_dependencies: dev_deps,
131                is_workspace_member,
132            };
133
134            crates.insert(package.name.clone(), crate_info);
135        }
136
137        Ok(Self {
138            root,
139            crates,
140            members,
141            dependency_graph,
142            reverse_deps,
143        })
144    }
145
146    /// Get a crate by name
147    pub fn get_crate(&self, name: &str) -> Option<&CrateInfo> {
148        self.crates.get(name)
149    }
150
151    /// Check if a crate is a workspace member
152    pub fn is_workspace_member(&self, name: &str) -> bool {
153        self.members.contains(&name.to_string())
154    }
155
156    /// Get direct dependencies of a crate
157    pub fn get_dependencies(&self, name: &str) -> Option<&HashSet<String>> {
158        self.dependency_graph.get(name)
159    }
160
161    /// Get crates that depend on this crate
162    pub fn get_dependents(&self, name: &str) -> Option<&HashSet<String>> {
163        self.reverse_deps.get(name)
164    }
165
166    /// Calculate the distance between two crates
167    /// Returns None if there's no path, 0 if same crate, 1 for direct dep, etc.
168    pub fn crate_distance(&self, from: &str, to: &str) -> Option<usize> {
169        if from == to {
170            return Some(0);
171        }
172
173        // Direct dependency check
174        if self
175            .dependency_graph
176            .get(from)
177            .is_some_and(|deps| deps.contains(to))
178        {
179            return Some(1);
180        }
181
182        // BFS for longer paths
183        let mut visited = HashSet::new();
184        let mut queue = vec![(from.to_string(), 0usize)];
185
186        while let Some((current, dist)) = queue.pop() {
187            if visited.contains(&current) {
188                continue;
189            }
190            visited.insert(current.clone());
191
192            if let Some(deps) = self.dependency_graph.get(&current) {
193                for dep in deps {
194                    if dep == to {
195                        return Some(dist + 1);
196                    }
197                    if !visited.contains(dep) {
198                        queue.push((dep.clone(), dist + 1));
199                    }
200                }
201            }
202        }
203
204        None
205    }
206
207    /// Get all source files for workspace members
208    pub fn get_all_source_files(&self) -> Vec<PathBuf> {
209        let mut files = Vec::new();
210
211        for member in &self.members {
212            if let Some(crate_info) = self.crates.get(member)
213                && crate_info.src_path.exists()
214            {
215                for entry in walkdir::WalkDir::new(&crate_info.src_path)
216                    .follow_links(true)
217                    .into_iter()
218                    .filter_map(|e| e.ok())
219                {
220                    let path = entry.path();
221                    if path.extension().is_some_and(|ext| ext == "rs") {
222                        files.push(path.to_path_buf());
223                    }
224                }
225            }
226        }
227
228        files
229    }
230}
231
232/// Find Cargo.toml by walking up from the given path
233fn find_cargo_toml(start: &Path) -> Result<PathBuf, WorkspaceError> {
234    let mut current = if start.is_file() {
235        start.parent().map(|p| p.to_path_buf())
236    } else {
237        Some(start.to_path_buf())
238    };
239
240    while let Some(dir) = current {
241        let cargo_toml = dir.join("Cargo.toml");
242        if cargo_toml.exists() {
243            return Ok(cargo_toml);
244        }
245        current = dir.parent().map(|p| p.to_path_buf());
246    }
247
248    Err(WorkspaceError::InvalidManifest(start.display().to_string()))
249}
250
251/// Resolve a module path to a crate name
252/// e.g., "crate::models::user" in package "my-app" -> "my-app"
253/// e.g., "serde::Serialize" -> "serde"
254pub fn resolve_crate_from_path(
255    use_path: &str,
256    current_crate: &str,
257    workspace: &WorkspaceInfo,
258) -> Option<String> {
259    let parts: Vec<&str> = use_path.split("::").collect();
260
261    if parts.is_empty() {
262        return None;
263    }
264
265    match parts[0] {
266        "crate" | "self" | "super" => {
267            // Internal reference to current crate
268            Some(current_crate.to_string())
269        }
270        first_segment => {
271            // Check if it's a known crate
272            // Convert hyphens to underscores for crate names
273            let normalized = first_segment.replace('-', "_");
274
275            // Check workspace members first
276            for member in &workspace.members {
277                let member_normalized = member.replace('-', "_");
278                if member_normalized == normalized {
279                    return Some(member.clone());
280                }
281            }
282
283            // Check all crates
284            for name in workspace.crates.keys() {
285                let name_normalized = name.replace('-', "_");
286                if name_normalized == normalized {
287                    return Some(name.clone());
288                }
289            }
290
291            // Assume it's an external crate
292            Some(first_segment.to_string())
293        }
294    }
295}
296
297#[cfg(test)]
298mod tests {
299    use super::*;
300
301    #[test]
302    fn test_find_cargo_toml() {
303        // Test in the current project
304        let result = find_cargo_toml(Path::new("."));
305        assert!(result.is_ok());
306        assert!(result.unwrap().ends_with("Cargo.toml"));
307    }
308
309    #[test]
310    fn test_resolve_crate_from_path() {
311        let workspace = WorkspaceInfo {
312            root: PathBuf::new(),
313            crates: HashMap::new(),
314            members: vec!["my-app".to_string(), "my-lib".to_string()],
315            dependency_graph: HashMap::new(),
316            reverse_deps: HashMap::new(),
317        };
318
319        // Internal reference
320        assert_eq!(
321            resolve_crate_from_path("crate::models::User", "my-app", &workspace),
322            Some("my-app".to_string())
323        );
324
325        // Workspace member reference
326        assert_eq!(
327            resolve_crate_from_path("my_lib::utils", "my-app", &workspace),
328            Some("my-lib".to_string())
329        );
330
331        // External crate
332        assert_eq!(
333            resolve_crate_from_path("serde::Serialize", "my-app", &workspace),
334            Some("serde".to_string())
335        );
336    }
337}