Skip to main content

floe_core/io/storage/providers/
local.rs

1use std::path::{Path, PathBuf};
2
3use glob::glob;
4
5use crate::errors::{RunError, StorageError};
6use crate::{config, ConfigError, FloeResult};
7
8use crate::io::storage::{planner, ObjectRef, StorageClient};
9
10pub struct LocalClient;
11
12impl LocalClient {
13    pub fn new() -> Self {
14        Self
15    }
16}
17
18impl Default for LocalClient {
19    fn default() -> Self {
20        Self::new()
21    }
22}
23
24impl StorageClient for LocalClient {
25    fn list(&self, prefix: &str) -> FloeResult<Vec<ObjectRef>> {
26        let path = Path::new(prefix);
27        if path.is_file() {
28            let uri = self.resolve_uri(prefix)?;
29            return Ok(vec![ObjectRef {
30                uri,
31                key: prefix.to_string(),
32                last_modified: None,
33                size: None,
34            }]);
35        }
36        if !path.exists() {
37            return Ok(Vec::new());
38        }
39        let mut refs = Vec::new();
40        for entry in std::fs::read_dir(path)? {
41            let entry = entry?;
42            let path = entry.path();
43            if path.is_file() {
44                let key = path.display().to_string();
45                let uri = self.resolve_uri(&key)?;
46                refs.push(ObjectRef {
47                    uri,
48                    key,
49                    last_modified: None,
50                    size: None,
51                });
52            }
53        }
54        refs = planner::stable_sort_refs(refs);
55        Ok(refs)
56    }
57
58    fn download_to_temp(&self, uri: &str, temp_dir: &Path) -> FloeResult<PathBuf> {
59        let src = PathBuf::from(uri.trim_start_matches("local://"));
60        let dest = temp_dir.join(
61            src.file_name()
62                .and_then(|name| name.to_str())
63                .unwrap_or("object"),
64        );
65        planner::ensure_parent_dir(&dest)?;
66        std::fs::copy(&src, &dest).map_err(|err| {
67            Box::new(StorageError(format!(
68                "local download failed from {}: {err}",
69                src.display()
70            ))) as Box<dyn std::error::Error + Send + Sync>
71        })?;
72        Ok(dest)
73    }
74
75    fn upload_from_path(&self, local_path: &Path, uri: &str) -> FloeResult<()> {
76        let dest = PathBuf::from(uri.trim_start_matches("local://"));
77        planner::ensure_parent_dir(&dest)?;
78        std::fs::copy(local_path, &dest).map_err(|err| {
79            Box::new(StorageError(format!(
80                "local upload failed to {}: {err}",
81                dest.display()
82            ))) as Box<dyn std::error::Error + Send + Sync>
83        })?;
84        Ok(())
85    }
86
87    fn resolve_uri(&self, path: &str) -> FloeResult<String> {
88        let path = Path::new(path);
89        let normalized = if path.is_absolute() {
90            crate::io::storage::paths::normalize_local_path(path)
91        } else {
92            let abs = std::env::current_dir()?.join(path);
93            crate::io::storage::paths::normalize_local_path(&abs)
94        };
95        Ok(format!("local://{}", normalized.display()))
96    }
97
98    fn copy_object(&self, src_uri: &str, dst_uri: &str) -> FloeResult<()> {
99        let src = Path::new(src_uri.trim_start_matches("local://"));
100        let dst = Path::new(dst_uri.trim_start_matches("local://"));
101        planner::ensure_parent_dir(dst)?;
102        std::fs::copy(src, dst).map_err(|err| {
103            Box::new(StorageError(format!(
104                "local copy failed from {} to {}: {err}",
105                src.display(),
106                dst.display()
107            ))) as Box<dyn std::error::Error + Send + Sync>
108        })?;
109        Ok(())
110    }
111
112    fn delete_object(&self, uri: &str) -> FloeResult<()> {
113        let path = Path::new(uri.trim_start_matches("local://"));
114        if path.exists() {
115            std::fs::remove_file(path).map_err(|err| {
116                Box::new(StorageError(format!(
117                    "local delete failed for {}: {err}",
118                    path.display()
119                ))) as Box<dyn std::error::Error + Send + Sync>
120            })?;
121        }
122        Ok(())
123    }
124
125    fn exists(&self, uri: &str) -> FloeResult<bool> {
126        let path = Path::new(uri.trim_start_matches("local://"));
127        Ok(path.exists())
128    }
129}
130
131#[derive(Debug, Clone, Copy, PartialEq, Eq)]
132pub enum LocalInputMode {
133    File,
134    Directory,
135}
136
137#[derive(Debug, Clone)]
138pub struct ResolvedLocalInputs {
139    pub files: Vec<PathBuf>,
140    pub mode: LocalInputMode,
141}
142
143pub fn resolve_local_inputs(
144    config_dir: &Path,
145    entity_name: &str,
146    source: &config::SourceConfig,
147    storage: &str,
148    default_globs: &[String],
149) -> FloeResult<ResolvedLocalInputs> {
150    let default_options = config::SourceOptions::default();
151    let options = source.options.as_ref().unwrap_or(&default_options);
152    let recursive = options.recursive.unwrap_or(false);
153    let glob_override = options.glob.as_deref();
154    let raw_path = source.path.as_str();
155
156    if is_glob_pattern(raw_path) {
157        let pattern_path = resolve_glob_pattern(config_dir, raw_path);
158        let pattern = pattern_path.to_string_lossy().to_string();
159        let files = collect_glob_files(&pattern)?;
160        if files.is_empty() {
161            let (base_path, glob_used) = split_glob_details(&pattern_path, raw_path);
162            return Err(Box::new(RunError(no_match_message(
163                entity_name,
164                storage,
165                &base_path,
166                &glob_used,
167                recursive,
168            ))));
169        }
170        return Ok(ResolvedLocalInputs {
171            files,
172            mode: LocalInputMode::Directory,
173        });
174    }
175
176    let base_path = config::resolve_local_path(config_dir, raw_path);
177    if base_path.is_file() {
178        return Ok(ResolvedLocalInputs {
179            files: vec![base_path],
180            mode: LocalInputMode::File,
181        });
182    }
183
184    let glob_used = if let Some(glob_override) = glob_override {
185        vec![glob_override.to_string()]
186    } else {
187        default_globs.to_vec()
188    };
189    if !base_path.is_dir() {
190        return Err(Box::new(RunError(no_match_message(
191            entity_name,
192            storage,
193            &base_path.display().to_string(),
194            &glob_used.join(","),
195            recursive,
196        ))));
197    }
198
199    let pattern_paths = if recursive {
200        glob_used
201            .iter()
202            .map(|glob| base_path.join("**").join(glob))
203            .collect::<Vec<_>>()
204    } else {
205        glob_used
206            .iter()
207            .map(|glob| base_path.join(glob))
208            .collect::<Vec<_>>()
209    };
210    let files = collect_glob_files_multi(&pattern_paths)?;
211    if files.is_empty() {
212        return Err(Box::new(RunError(no_match_message(
213            entity_name,
214            storage,
215            &base_path.display().to_string(),
216            &glob_used.join(","),
217            recursive,
218        ))));
219    }
220
221    Ok(ResolvedLocalInputs {
222        files,
223        mode: LocalInputMode::Directory,
224    })
225}
226
227fn is_glob_pattern(value: &str) -> bool {
228    value.contains('*') || value.contains('?') || value.contains('[')
229}
230
231fn resolve_glob_pattern(config_dir: &Path, raw_path: &str) -> PathBuf {
232    let path = Path::new(raw_path);
233    if path.is_absolute() {
234        path.to_path_buf()
235    } else {
236        config_dir.join(raw_path)
237    }
238}
239
240fn split_glob_details(pattern_path: &Path, raw_pattern: &str) -> (String, String) {
241    let base = pattern_path
242        .parent()
243        .unwrap_or(pattern_path)
244        .display()
245        .to_string();
246    let glob_used = pattern_path
247        .file_name()
248        .map(|name| name.to_string_lossy().to_string())
249        .unwrap_or_else(|| raw_pattern.to_string());
250    (base, glob_used)
251}
252
253fn collect_glob_files(pattern: &str) -> FloeResult<Vec<PathBuf>> {
254    let mut files = Vec::new();
255    let entries = glob(pattern).map_err(|err| {
256        Box::new(ConfigError(format!(
257            "invalid glob pattern {pattern:?}: {err}"
258        ))) as Box<dyn std::error::Error + Send + Sync>
259    })?;
260    for entry in entries {
261        let path = entry.map_err(|err| {
262            Box::new(ConfigError(format!(
263                "glob match failed for {pattern:?}: {err}"
264            ))) as Box<dyn std::error::Error + Send + Sync>
265        })?;
266        if path.is_file() {
267            files.push(crate::io::storage::paths::normalize_local_path(&path));
268        }
269    }
270    files.sort_by(|a, b| a.to_string_lossy().cmp(&b.to_string_lossy()));
271    Ok(files)
272}
273
274fn collect_glob_files_multi(patterns: &[PathBuf]) -> FloeResult<Vec<PathBuf>> {
275    let mut files = Vec::new();
276    for pattern_path in patterns {
277        let pattern = pattern_path.to_string_lossy().to_string();
278        files.extend(collect_glob_files(&pattern)?);
279    }
280    files.sort_by(|a, b| a.to_string_lossy().cmp(&b.to_string_lossy()));
281    files.dedup_by(|a, b| a.to_string_lossy() == b.to_string_lossy());
282    Ok(files)
283}
284
285fn no_match_message(
286    entity_name: &str,
287    storage: &str,
288    base_path: &str,
289    glob_used: &str,
290    recursive: bool,
291) -> String {
292    format!(
293        "entity.name={} source.storage={} no input files matched (base_path={}, glob={}, recursive={})",
294        entity_name, storage, base_path, glob_used, recursive
295    )
296}