use crate::linter::{Diagnostic, LintResult, Severity, Span};
use regex::Regex;
static FOR_FIND_LOOP: std::sync::LazyLock<Regex> = std::sync::LazyLock::new(|| {
Regex::new(r"for\s+\w+\s+in\s+(?:\$\(|`)find\s+").unwrap()
});
pub fn check(source: &str) -> LintResult {
let mut result = LintResult::new();
for (line_num, line) in source.lines().enumerate() {
let line_num = line_num + 1;
if line.trim_start().starts_with('#') {
continue;
}
if FOR_FIND_LOOP.is_match(line) {
if let Some(mat) = FOR_FIND_LOOP.find(line) {
let pos = mat.start();
let before = &line[..pos];
let quote_count = before.matches('"').count() + before.matches('\'').count();
if quote_count % 2 == 1 {
continue;
}
let start_col = pos + 1;
let end_col = mat.end() + 1;
let diagnostic = Diagnostic::new(
"SC2038",
Severity::Warning,
"Use find -exec or -print0/-0 instead of for loop over find output. Filenames with spaces/newlines will break.".to_string(),
Span::new(line_num, start_col, line_num, end_col),
);
result.add(diagnostic);
}
}
}
result
}
#[cfg(test)]
mod tests {
use super::*;
#[test]
fn test_sc2038_for_find_command_subst() {
let code = r#"for file in $(find . -name "*.txt"); do echo "$file"; done"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 1);
assert_eq!(result.diagnostics[0].code, "SC2038");
assert_eq!(result.diagnostics[0].severity, Severity::Warning);
assert!(result.diagnostics[0].message.contains("-print0"));
}
#[test]
fn test_sc2038_for_find_backticks() {
let code = r#"for f in `find . -type f`; do rm "$f"; done"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 1);
}
#[test]
fn test_sc2038_find_exec_ok() {
let code = r#"find . -name "*.txt" -exec echo {} +"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_find_print0_ok() {
let code = r#"find . -name "*.txt" -print0 | while IFS= read -r -d '' file; do echo "$file"; done"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_regular_for_ok() {
let code = r#"for file in *.txt; do echo "$file"; done"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_in_quotes_ok() {
let code = r#"echo "for file in $(find . -name '*.txt')""#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_comment_ok() {
let code = r#"# for file in $(find . -name "*.txt"); do"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_multiline_find() {
let code = r#"
for item in $(find /var/log \
-name "*.log"); do
cat "$item"
done
"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 1);
}
#[test]
fn test_sc2038_while_read_ok() {
let code = r#"while IFS= read -r line; do echo "$line"; done < <(find . -type f)"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
#[test]
fn test_sc2038_array_assignment() {
let code = r#"files=($(find . -name "*.sh"))"#;
let result = check(code);
assert_eq!(result.diagnostics.len(), 0);
}
}