Skip to main content

kaish_glob/
lib.rs

1//! kaish-glob: Glob matching and async file walking.
2//!
3//! Provides:
4//! - **glob_match**: Shell-style glob pattern matching with brace expansion
5//! - **GlobPath**: Path-aware glob matching with `**` (globstar) support
6//! - **FileWalker**: Async recursive directory walker, generic over `WalkerFs`
7//! - **IgnoreFilter**: Gitignore-style pattern filtering
8//! - **IncludeExclude**: rsync-style include/exclude filters
9//!
10//! The walker is generic over `WalkerFs`, a minimal read-only filesystem trait.
11//! Consumers implement `WalkerFs` to adapt their own filesystem abstraction.
12
13mod filter;
14pub mod glob;
15mod glob_path;
16mod ignore;
17mod walker;
18
19pub use filter::{FilterResult, IncludeExclude};
20pub use glob::{contains_glob, expand_braces, glob_match};
21pub use glob_path::{GlobPath, PathSegment, PatternError};
22pub use ignore::IgnoreFilter;
23pub use walker::{EntryTypes, ErrorCallback, FileWalker, WalkOptions};
24
25use async_trait::async_trait;
26use std::path::{Path, PathBuf};
27use thiserror::Error;
28
29/// Errors from filesystem operations within the walker.
30#[derive(Debug, Error)]
31pub enum WalkerError {
32    #[error("not found: {0}")]
33    NotFound(String),
34    #[error("permission denied: {0}")]
35    PermissionDenied(String),
36    #[error("io error: {0}")]
37    Io(String),
38    #[error("symlink cycle detected: {0}")]
39    SymlinkCycle(String),
40}
41
42/// Minimal read-only filesystem abstraction for the walker.
43///
44/// Implement this trait to adapt your project's filesystem layer
45/// (VFS, real FS, CRDT blocks, etc.) to `FileWalker` and `IgnoreFilter`.
46#[async_trait]
47pub trait WalkerFs: Send + Sync {
48    /// The directory entry type returned by `list_dir`.
49    type DirEntry: WalkerDirEntry;
50
51    /// List the entries in a directory.
52    async fn list_dir(&self, path: &Path) -> Result<Vec<Self::DirEntry>, WalkerError>;
53
54    /// Read the full contents of a file into memory.
55    ///
56    /// Currently used for loading `.gitignore` files. Implementations SHOULD
57    /// impose a reasonable size limit to prevent accidental multi-gigabyte reads.
58    async fn read_file(&self, path: &Path) -> Result<Vec<u8>, WalkerError>;
59
60    /// Check if a path is a directory.
61    async fn is_dir(&self, path: &Path) -> bool;
62
63    /// Check if a path exists.
64    async fn exists(&self, path: &Path) -> bool;
65
66    /// Return the canonical (resolved) path, following symlinks.
67    ///
68    /// Used by `FileWalker` for symlink cycle detection when `follow_symlinks`
69    /// is enabled. Implementations that support symlinks should resolve the path
70    /// to its real location. The default returns the path unchanged.
71    async fn canonicalize(&self, path: &Path) -> PathBuf {
72        path.to_path_buf()
73    }
74
75    /// Return the file size in bytes, or `None` if size cannot be determined.
76    ///
77    /// Used by `FileWalker` to honor `WalkOptions::max_filesize`.
78    /// Implementations that don't know file sizes (or for which a size query
79    /// is too expensive) may return `None` — the walker treats that as
80    /// "unknown size" and yields the file regardless of the limit.
81    async fn file_size(&self, _path: &Path) -> Option<u64> {
82        None
83    }
84}
85
86/// A single entry returned by `WalkerFs::list_dir`.
87pub trait WalkerDirEntry: Send {
88    /// The entry name (file or directory name, not full path).
89    fn name(&self) -> &str;
90
91    /// True if this entry is a directory.
92    fn is_dir(&self) -> bool;
93
94    /// True if this entry is a regular file.
95    fn is_file(&self) -> bool;
96
97    /// True if this entry is a symbolic link.
98    fn is_symlink(&self) -> bool;
99}