hunch 2.0.2 - Docs.rs

//! Title string cleaning — composed from small, single-purpose transforms.
//!
//! ## Design
//!
//! Title cleaning is a pipeline. Each step does *one* thing and returns a
//! `String`. The public entry points (`clean_title`, `clean_episode_title`,
//! `clean_title_preserve_dashes`) compose these steps.
//!
//! Steps (in pipeline order):
//!
//! 1. [`strip_leading_brackets`] — drop `[XCT]`, `[阿维达]`, ... at the start.
//! 2. [`strip_paren_year`] — drop a trailing `(YYYY)`.
//! 3. [`strip_paren_groups`] — drop all `(...)` groups, with empty fallback.
//! 4. [`normalize_separators`] — convert `.`, `_`, `+`, brackets, `*` to
//!    spaces. Dash handling is parameterized by [`DashPolicy`].
//! 5. [`trim_trailing_punct`] — drop stray `:-,;` at the end.
//! 6. [`strip_trailing_keywords`] — drop trailing `Part N`, `Season N`,
//!    `Episode`, `-xNN` bonus markers (caller opt-in).
//!
//! See `D10: Refactor before accreting` in `DESIGN.md` — this module
//! exists because we hit the "2nd cleaning mode + bool flag" tripwire.

use super::{BRACKETS, SEPS};

use std::sync::LazyLock;

// ── Public composers ───────────────────────────────────────────────────────

/// Standard title cleaning: separators → spaces, brackets stripped,
/// trailing `Part N` / `Season N` / bonus markers removed.
pub(super) fn clean_title(raw: &str) -> String {
    let s = strip_leading_brackets(raw);
    let s = strip_paren_year(&s);
    let s = strip_paren_groups(&s);
    let s = normalize_separators(&s, DashPolicy::WordDashOnly);
    let s = trim_trailing_punct(&s);
    strip_trailing_keywords(&s)
}

/// Episode-title cleaning: same as [`clean_title`] but keeps trailing
/// `Part N` / `Season N` (those words are valid episode-title content)
/// and trims leading separator junk first.
pub(super) fn clean_episode_title(raw: &str) -> String {
    let trimmed = raw.trim_start_matches(['.', '_', ' ', '-']);
    let s = strip_leading_brackets(trimmed);
    let s = strip_paren_year(&s);
    let s = strip_paren_groups(&s);
    let s = normalize_separators(&s, DashPolicy::WordDashOnly);
    trim_trailing_punct(&s)
}

/// Clean a raw title while preserving internal `" - "` (and equivalents
/// `_-_`, `.-.`) as literal `" - "` separators, and without stripping
/// trailing `Part N` keywords.
///
/// Use this when the title boundary has already been correctly identified
/// by upstream logic (e.g., anime bracket releases
/// `[Group] Show - Sub Part 2 - 13 [tags]`) and the dashes / `Part N`
/// are genuinely part of the title.
///
/// Composition: same pipeline as [`clean_title`] but with
/// [`DashPolicy::PreserveStructuralDash`] and no trailing-keyword strip.
pub(super) fn clean_title_preserve_dashes(raw: &str) -> String {
    let s = strip_leading_brackets(raw);
    let s = strip_paren_year(&s);
    let s = strip_paren_groups(&s);
    let s = normalize_separators(&s, DashPolicy::PreserveStructuralDash);
    trim_trailing_punct(&s)
}

// ── DashPolicy ─────────────────────────────────────────────────────────────

/// How [`normalize_separators`] handles `-` characters.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
pub(super) enum DashPolicy {
    /// Keep `-` only between alphanumerics (e.g. `Spider-Man`); convert
    /// every other dash to a space. This is the standard mode used by
    /// [`clean_title`] and [`clean_episode_title`].
    WordDashOnly,
    /// Keep `-` between alphanumerics, AND preserve a separator-flanked
    /// dash (e.g. `_-_`, ` - `, `.-.`) as a literal ` - ` (space-dash-space)
    /// in the output. Used when the structural separator carries title
    /// content that would otherwise be lost (anime
    /// `[Group] Title - Sub - Ep [tags]` where `Sub` belongs to the title).
    PreserveStructuralDash,
}

// ── Step 1: leading brackets ───────────────────────────────────────────────

/// Strip `[…]` groups at the start (and any trailing separators) until the
/// string no longer begins with `[`.
pub(super) fn strip_leading_brackets(raw: &str) -> String {
    let mut s = raw.to_string();
    while s.starts_with('[') {
        if let Some(end) = s.find(']') {
            s = s[end + 1..].to_string();
            s = s.trim_start_matches(SEPS).to_string();
        } else {
            break;
        }
    }
    s
}

// ── Step 2: trailing parenthesized year ────────────────────────────────────

static RE_PAREN_YEAR: LazyLock<regex::Regex> = LazyLock::new(|| {
    regex::Regex::new(r"\s*\((?:19|20)\d{2}\)\s*$").expect("RE_PAREN_YEAR regex is valid")
});

/// Strip a trailing `(YYYY)`: `Movie Name (2005)` → `Movie Name`.
pub(super) fn strip_paren_year(s: &str) -> String {
    if let Some(m) = RE_PAREN_YEAR.find(s) {
        s[..m.start()].to_string()
    } else {
        s.to_string()
    }
}

// ── Step 3: parenthesized groups ───────────────────────────────────────────

static RE_PAREN_GROUP: LazyLock<regex::Regex> =
    LazyLock::new(|| regex::Regex::new(r"\s*\([^)]*\)\s*").expect("RE_PAREN_GROUP regex is valid"));

/// Strip all `(...)` groups (alternative titles, country tags, etc.).
///
/// If stripping would empty the string, the original is returned — a title
/// that is *only* a parenthesized phrase is better than nothing.
pub(super) fn strip_paren_groups(s: &str) -> String {
    let stripped = RE_PAREN_GROUP.replace_all(s, " ").into_owned();
    if stripped.trim().is_empty() {
        s.to_string()
    } else {
        stripped
    }
}

// ── Step 4: separator normalization ────────────────────────────────────────

static RE_DOT_ACRONYM: LazyLock<regex::Regex> = LazyLock::new(|| {
    regex::Regex::new(r"(?:^|[\s._])([A-Za-z0-9](?:\.[A-Za-z0-9]){2,}\.?)")
        .expect("RE_DOT_ACRONYM regex is valid")
});

// ── Helpers extracted from `normalize_separators` (#146 mutant kills) ──
//
// Both helpers are pure value-in / value-out predicates that pin
// surviving boundary mutants from the 2026-04-19 nightly run. They
// live as free functions (rather than closures inside the body) so the
// unit tests in this module can exercise them directly.

/// True when a dot-acronym regex match begins AT a separator byte that
/// should be excluded from the protected range.
///
/// The regex `(?:^|[\s._])([A-Za-z0-9](?:\.[A-Za-z0-9]){2,}\.?)` may
/// capture a leading separator (space/tab/dot/underscore); when it
/// does, the caller advances `actual_start` by one byte to skip it.
///
/// Returns `false` when `match_start == 0` (no leading byte to inspect)
/// or when the byte at `match_start` isn't one of the four separators.
fn acronym_match_starts_at_separator(input: &str, match_start: usize) -> bool {
    match_start > 0 && matches!(input.as_bytes()[match_start], b' ' | b'\t' | b'.' | b'_')
}

/// True when `pos` falls inside any of the half-open `[start, end)`
/// byte ranges. Used to decide whether a `.` at byte position `pos`
/// lies within a protected dot-acronym span.
fn position_in_any_range(pos: usize, ranges: &[(usize, usize)]) -> bool {
    ranges.iter().any(|(s, e)| pos >= *s && pos < *e)
}

/// Replace separators (`.`, `_`, `+`, brackets, `*`) with spaces, with
/// dash handling controlled by [`DashPolicy`].
///
/// Preserves dot-acronyms like `S.H.I.E.L.D.` by computing protected
/// byte ranges before the per-char rewrite.
pub(super) fn normalize_separators(s: &str, dash: DashPolicy) -> String {
    // Find dot-acronym byte ranges to protect from dot→space conversion.
    let protected_ranges: Vec<(usize, usize)> = RE_DOT_ACRONYM
        .find_iter(s)
        .map(|m| {
            let actual_start = if acronym_match_starts_at_separator(s, m.start()) {
                m.start() + 1
            } else {
                m.start()
            };
            (actual_start, m.end())
        })
        .collect();

    let in_protected = |pos: usize| -> bool { position_in_any_range(pos, &protected_ranges) };

    let chars: Vec<char> = s.chars().collect();
    let mut byte_positions: Vec<usize> = Vec::with_capacity(chars.len());
    let mut byte_pos = 0;
    for &c in &chars {
        byte_positions.push(byte_pos);
        byte_pos += c.len_utf8();
    }

    let mut out = String::with_capacity(s.len());
    for (i, &c) in chars.iter().enumerate() {
        match c {
            '-' => {
                let kind = classify_dash(&chars, i);
                match (kind, dash) {
                    (DashKind::WordDash, _) => out.push('-'),
                    (DashKind::SeparatorFlanked, DashPolicy::PreserveStructuralDash) => {
                        // Collapse any trailing space we just emitted so we
                        // don't get "  - " / " -  ". `collapse_spaces` at the
                        // end will normalize any remaining doubles, but emit
                        // exactly " - " here for clarity.
                        if out.ends_with(' ') {
                            out.pop();
                        }
                        out.push_str(" - ");
                    }
                    _ => out.push(' '),
                }
            }
            '.' if in_protected(byte_positions[i]) => out.push('.'),
            ch if SEPS.contains(&ch) || BRACKETS.contains(&ch) || ch == '*' => out.push(' '),
            ch => out.push(ch),
        }
    }
    collapse_spaces(&out)
}

/// Classification of a `-` character based on the chars immediately
/// surrounding it.
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
enum DashKind {
    /// Both neighbors are alphanumerics. Always preserved as `-`
    /// regardless of policy. Example: `Spider-Man`.
    WordDash,
    /// Both neighbors are filename separators (`.`, `_`, `+`, ` `). This
    /// is the structural " - " form. Preserved by
    /// [`DashPolicy::PreserveStructuralDash`], collapsed otherwise.
    SeparatorFlanked,
    /// Anything else (start/end of string, mixed neighbors, brackets, ...).
    /// Always collapsed to a space.
    Other,
}

fn classify_dash(chars: &[char], i: usize) -> DashKind {
    let prev = if i > 0 { Some(chars[i - 1]) } else { None };
    let next = chars.get(i + 1).copied();
    let is_alnum = |c: Option<char>| c.is_some_and(|c| c.is_alphanumeric());
    let is_sep = |c: Option<char>| c.is_some_and(|c| SEPS.contains(&c));
    if is_alnum(prev) && is_alnum(next) {
        DashKind::WordDash
    } else if is_sep(prev) && is_sep(next) {
        DashKind::SeparatorFlanked
    } else {
        DashKind::Other
    }
}

// (legacy `rewrite_dash` removed — logic now lives in `classify_dash`
//  + the per-char match in `normalize_separators`.)

// ── Step 5: trailing punctuation ───────────────────────────────────────────

/// Strip trailing punctuation that leaks from separator boundaries.
pub(super) fn trim_trailing_punct(s: &str) -> String {
    s.trim_end_matches([':', '-', ',', ';']).trim().to_string()
}

// ── Step 6: trailing keywords ──────────────────────────────────────────────

static RE_TRAILING_PART: LazyLock<regex::Regex> = LazyLock::new(|| {
    regex::Regex::new(r"(?i)\s+Part\s*(?:I{1,4}|IV|VI{0,3}|IX|X{0,3}|[0-9]+)?\s*$")
        .expect("RE_TRAILING_PART regex is valid")
});

static RE_TRAILING_SEASON: LazyLock<regex::Regex> = LazyLock::new(|| {
    // Matches trailing season tokens in two flavors:
    //   1. Long form: `Season 2`, `Saison 2`, `Stagione II`, `Temporada 3 & 4`, ...
    //   2. Short form: `S2`, `S03`, `S10` (anime fansub convention).
    //
    // The short form is anchored with `\b` and bounded to 1-3 digits so it
    // doesn't eat trailing words like `Inus` (which ends in `s`) or `Spider-Man`.
    regex::Regex::new(
        r"(?i)\s+(?:S\d{1,3}|(?:Saison|Temporada|Stagione|Tem\.?|Season|Seasons?)\s*(?:I{1,4}|IV|VI{0,3}|IX|X{0,3}|[0-9]+)?(?:\s*(?:&|and)\s*(?:I{1,4}|IV|VI{0,3}|IX|X{0,3}|[0-9]+))?)\s*$"
    ).expect("RE_TRAILING_SEASON regex is valid")
});

static RE_TRAILING_EP: LazyLock<regex::Regex> = LazyLock::new(|| {
    regex::Regex::new(r"(?i)\s+(?:Episodes?|Ep\.?)\s*$").expect("RE_TRAILING_EP regex is valid")
});

static RE_TRAILING_BONUS: LazyLock<regex::Regex> = LazyLock::new(|| {
    regex::Regex::new(r"(?i)[-]x\d{1,3}\s*$").expect("RE_TRAILING_BONUS regex is valid")
});

/// Strip trailing `Part`, `Season`, `Episode` keywords and `-xNN` bonus
/// markers from titles. Each strip is skipped if it would empty the title.
pub(super) fn strip_trailing_keywords(input: &str) -> String {
    let mut s = input.to_string();
    s = strip_if_nonempty(&s, &RE_TRAILING_PART);
    s = strip_if_nonempty(&s, &RE_TRAILING_SEASON);
    s = strip_if_nonempty(&s, &RE_TRAILING_EP);
    s = strip_if_nonempty(&s, &RE_TRAILING_BONUS);
    s
}

fn strip_if_nonempty(s: &str, re: &regex::Regex) -> String {
    if let Some(m) = re.find(s) {
        let stripped = &s[..m.start()];
        if !stripped.trim().is_empty() {
            return stripped.to_string();
        }
    }
    s.to_string()
}

// ── Whitespace utilities (used by other modules in the title subsystem) ───

/// Collapse multiple spaces into one and trim.
pub(super) fn collapse_spaces(s: &str) -> String {
    let mut result = String::with_capacity(s.len());
    let mut prev_space = true;
    for c in s.chars() {
        if c == ' ' {
            if !prev_space {
                result.push(' ');
            }
            prev_space = true;
        } else {
            result.push(c);
            prev_space = false;
        }
    }
    result.trim().to_string()
}

/// Strip a file extension from the end of a string.
pub(super) fn strip_extension(s: &str) -> &str {
    if let Some(dot) = s.rfind('.') {
        let ext = &s[dot + 1..];
        let ext_lower = ext.to_lowercase();
        if ext.len() <= 5 && is_likely_extension(&ext_lower) {
            return &s[..dot];
        }
    }
    s
}

/// Check if a string looks like a real file extension.
pub(super) fn is_likely_extension(ext: &str) -> bool {
    matches!(
        ext,
        "mkv"
            | "mp4"
            | "avi"
            | "wmv"
            | "flv"
            | "mov"
            | "webm"
            | "ogm"
            | "ogv"
            | "ts"
            | "m2ts"
            | "m4v"
            | "mpg"
            | "mpeg"
            | "vob"
            | "divx"
            | "3gp"
            | "srt"
            | "sub"
            | "ssa"
            | "ass"
            | "idx"
            | "sup"
            | "vtt"
            | "nfo"
            | "txt"
            | "jpg"
            | "jpeg"
            | "png"
            | "nzb"
            | "par"
            | "par2"
            | "iso"
            | "img"
            | "rar"
            | "zip"
            | "7z"
    )
}

/// Detect if a title looks like a scene abbreviation.
pub(super) fn is_abbreviated(title: &str) -> bool {
    let segments: Vec<&str> = title
        .split(|c: char| c.is_whitespace() || c == '-')
        .collect();
    segments.iter().all(|w| {
        w.len() <= 6
            && w.chars()
                .all(|c| c.is_ascii_lowercase() || c.is_ascii_digit())
    }) && title.len() <= 20
}

/// Score a string by casing quality. Higher = better casing.
///
/// Hoisted out of `pick_better_casing` to be directly unit-testable, so
/// each branch's exact return value gets pinned (rather than only being
/// observable through the comparison in `pick_better_casing`). This
/// shape was the highest-leverage mutation-testing finding from the
/// first nightly run — see docs/src/contributor-guide/mutation-baseline.md, three function-
/// stub mutants survived because no test pinned the actual scores.
///
/// Scoring rationale:
/// - All-uppercase letters (`-10`): SHOUTING titles are usually a
///   poor source compared to anything mixed-case.
/// - All-lowercase (`-5`): less bad than SHOUTING but still poor.
///   Note: a string with no alphabetic chars (e.g. "123") trivially
///   satisfies the all-uppercase predicate (vacuous truth on an
///   empty filter) and scores `-10`. Acceptable: such strings rarely
///   make it to this point as titles.
/// - Otherwise: count of whitespace-separated words starting with an
///   uppercase letter (Title Case scores higher than lower).
#[inline]
pub(super) fn casing_score(s: &str) -> i32 {
    if s.chars()
        .filter(|c| c.is_alphabetic())
        .all(|c| c.is_uppercase())
    {
        return -10;
    }
    if s.chars()
        .filter(|c| c.is_alphabetic())
        .all(|c| c.is_lowercase())
    {
        return -5;
    }
    s.split_whitespace()
        .filter(|w| w.starts_with(|c: char| c.is_uppercase()))
        .count() as i32
}

/// Pick the string with better casing when two titles match case-insensitively.
///
/// Ties go to `a` (left-hand argument), via `>=`. Callers rely on this
/// stable choice when the scores are identical.
pub(super) fn pick_better_casing<'a>(a: &'a str, b: &'a str) -> &'a str {
    if casing_score(a) >= casing_score(b) {
        a
    } else {
        b
    }
}

/// Check if a directory name is generic (should be skipped for title).
///
/// Generic directories are structural (e.g., "Season 1", "Extras") or
/// organizational (e.g., "Movies", "Downloads"). When walking parent
/// directories for title fallback, these are skipped so the real title
/// directory (e.g., "Transformers 1984") is found.
pub(crate) fn is_generic_dir(name: &str) -> bool {
    let lower = name.to_lowercase();

    // Exact matches (case-insensitive).
    if matches!(
        lower.as_str(),
        // Library root / organizational
        "movies"
            | "movie"
            | "films"
            | "film"
            | "series"
            | "tv shows"
            | "tvshows"
            | "tv"
            | "media"
            | "video"
            | "videos"
            | "anime"
            | "donghua"
            | "kids"
            | "cartoons"
            | "shows"
            | "documentary"
            | "documentaries"
            | "music"
            | "concert"
            | "concerts"
            // Language categories (library organization, not show titles)
            | "chinese"
            | "english"
            | "japanese"
            | "korean"
            | "french"
            | "german"
            | "spanish"
            | "italian"
            | "portuguese"
            | "russian"
            | "thai"
            | "hindi"
            | "arabic"
            // Download / system
            | "downloads"
            | "download"
            | "completed"
            | "mnt"
            | "nas"
            | "share"
            | "shares"
            | "data"
            | "public"
            | "home"
            | "tmp"
            | "temp"
            // Bonus / extras
            | "extras"
            | "extra"
            | "specials"
            | "special"
            | "bonus"
            | "featurettes"
            | "featurette"
            | "behind the scenes"
            | "deleted scenes"
            | "interviews"
            | "interview"
            | "trailers"
            | "trailer"
            | "samples"
            | "sample"
            // CJK bonus / extras directory names
            | "特典映像"  // tokuten eizou — special footage (JP)
            | "特典"      // tokuten — bonus/extras (JP)
            | "映像特典"  // eizou tokuten — video bonus (JP)
            | "sp"
            // Anime-extras structural directory names. Real-world layouts:
            //   Show/PV/file.mkv, Show/NCOP&NCED/file.mkv, Show/menu/file.mkv
            // These are STRUCTURAL groupings (preview clips, creditless
            // openings/endings, BD menu screens) — not the show title.
            // Without this list, parent_dir would leak "PV"/"menu"/etc.
            // as the title in --batch -r mode. (#244)
            | "pv"
            | "op"
            | "ed"
            | "ncop"
            | "nced"
            | "ncop&nced"
            | "nced&ncop"
            | "menu"
            | "menus"
            | "ova"
            | "oad"
            | "ona"
            | "cm"
            | "tokuten"
            // Subtitles / audio
            | "subs"
            | "subtitles"
            | "subtitle"
            | "ost"
            | "soundtrack"
            | "soundtracks"
    ) {
        return true;
    }

    // Prefix matches (e.g., "Season 1", "Disc 2", "CD1").
    if lower.starts_with("season")
        || lower.starts_with("saison")
        || lower.starts_with("temporada")
        || lower.starts_with("stagione")
        || lower.starts_with("disc")
        || lower.starts_with("disk")
        || lower.starts_with("dvd")
    {
        return true;
    }

    // CD1, CD2, etc.
    if lower.starts_with("cd") && lower[2..].chars().all(|c| c.is_ascii_digit()) && lower.len() <= 4
    {
        return true;
    }

    // Quality-as-dir: "1080p", "720p", "2160p", "4K", "4k"
    if lower.ends_with('p') && lower[..lower.len() - 1].chars().all(|c| c.is_ascii_digit()) {
        return true;
    }
    if lower == "4k" {
        return true;
    }

    false
}

#[cfg(test)]
mod tests {
    use super::*;

    // ── Pipeline integration ─────────────────────────────────────────

    #[test]
    fn test_clean_title_dots() {
        assert_eq!(clean_title("The.Matrix"), "The Matrix");
    }

    #[test]
    fn test_clean_title_underscores() {
        assert_eq!(clean_title("The_Matrix_Reloaded"), "The Matrix Reloaded");
    }

    #[test]
    fn test_strip_leading_bracket() {
        assert_eq!(clean_title("[XCT].Le.Prestige"), "Le Prestige");
    }

    #[test]
    fn test_strip_paren_year() {
        assert_eq!(clean_title("Movie Name (2005)"), "Movie Name");
    }

    // ── Per-step unit tests ──────────────────────────────────────────

    #[test]
    fn step_strip_leading_brackets_drops_multiple() {
        assert_eq!(strip_leading_brackets("[A][B] Show"), "Show");
        assert_eq!(strip_leading_brackets("[XCT].Le.Prestige"), "Le.Prestige");
    }

    #[test]
    fn step_strip_leading_brackets_unclosed_passes_through() {
        // No closing ']' → leave the input alone (don't loop forever).
        assert_eq!(strip_leading_brackets("[unclosed Show"), "[unclosed Show");
    }

    #[test]
    fn step_strip_paren_year_only_at_end() {
        // The regex consumes leading whitespace before `(YYYY)`.
        assert_eq!(strip_paren_year("Movie (2005)"), "Movie");
        // Year in the middle is preserved (only trailing year is stripped).
        assert_eq!(strip_paren_year("(2005) Movie"), "(2005) Movie");
    }

    #[test]
    fn step_strip_paren_groups_empty_fallback() {
        // Stripping all parens would empty the string → return the original.
        assert_eq!(strip_paren_groups("(only paren)"), "(only paren)");
        // Otherwise strip them.
        assert_eq!(strip_paren_groups("Movie (alt)"), "Movie ");
    }

    #[test]
    fn step_normalize_preserves_word_dash() {
        let out = normalize_separators("Spider-Man.2002", DashPolicy::WordDashOnly);
        assert_eq!(out, "Spider-Man 2002");
    }

    #[test]
    fn step_normalize_drops_separator_flanked_dash() {
        // Default policy: " - " becomes a single space.
        let out = normalize_separators("Show - Sub", DashPolicy::WordDashOnly);
        assert_eq!(out, "Show Sub");
    }

    #[test]
    fn step_normalize_preserves_separator_flanked_dash_in_preserve_mode() {
        // PreserveStructuralDash keeps space-flanked, dot-flanked, and
        // underscore-flanked dashes as a literal " - ".
        assert_eq!(
            normalize_separators("Show - Sub", DashPolicy::PreserveStructuralDash),
            "Show - Sub"
        );
        assert_eq!(
            normalize_separators("Show_-_Sub_-_Final", DashPolicy::PreserveStructuralDash),
            "Show - Sub - Final"
        );
        assert_eq!(
            normalize_separators("Show.-.Sub", DashPolicy::PreserveStructuralDash),
            "Show - Sub"
        );
        // But word-dashes still survive even in preserve mode.
        assert_eq!(
            normalize_separators("Spider-Man", DashPolicy::PreserveStructuralDash),
            "Spider-Man"
        );
    }

    #[test]
    fn preserve_dashes_keeps_inner_separator() {
        // Standard clean_title collapses " - " into a single space.
        assert_eq!(clean_title("Show - Subtitle"), "Show Subtitle");
        // The preserve variant keeps the structural separator literal.
        assert_eq!(
            clean_title_preserve_dashes("Show - Subtitle"),
            "Show - Subtitle"
        );
        // And it does not strip a trailing "Part N" (which is genuine title content).
        assert_eq!(
            clean_title_preserve_dashes("San no Shou Part 2"),
            "San no Shou Part 2"
        );
        // "_-_" and ".-." should normalize to " - " too.
        assert_eq!(
            clean_title_preserve_dashes("Show_-_Sub_-_Final"),
            "Show - Sub - Final"
        );
    }

    #[test]
    fn preserve_dashes_kitchen_sink_composition() {
        // Kitchen-sink test: locks in the *composition order* of every
        // transform inside `clean_title_preserve_dashes` simultaneously.
        //
        // Pre-PR-C this composition was only exercised piecewise (one
        // transform per test). When the pipeline was decomposed in #130,
        // the per-transform tests caught regressions inside each step,
        // but no single test caught "Step 2 strips the year that Step 4
        // expected to see, leaving Step 4 a no-op". This test pins the
        // full chain end-to-end so any future re-decomposition of
        // `clean.rs` (and there will be one — see DESIGN D10) cannot
        // silently change interaction order.
        //
        // Composition under exercise (left to right, all in one input):
        //   1. strip_leading_brackets:   `[Group] ` → ""
        //   2. strip_paren_year:         ` (2014)` at end → ""
        //                                (only fires at end-of-string)
        //   3. strip_paren_groups:       `(Director's Cut)` mid-string → " "
        //   4. normalize_separators(PreserveStructuralDash):
        //        - dot-acronyms preserved
        //        - `_-_` and `.-.` and ` - ` → ` - `
        //        - other separators → single space
        //   5. trim_trailing_punct:      strip trailing `:-,;`
        //
        // Note: the trailing-keyword strip (Step 6) is intentionally NOT
        // applied by `clean_title_preserve_dashes` — "Part N" is genuine
        // title content for this code path.
        let input =
            "[Group].Show_-_Sub.-.Detail.(Director's.Cut).Part.2.S.H.I.E.L.D._-_End.(2014).";
        // Note: the dot-acronym detector greedily extends "S.H.I.E.L.D."
        // backwards to include the preceding `2.` (since `2` is also
        // alphanumeric, the run `2.S.H.I.E.L.D.` matches the
        // `[A-Za-z0-9](\.[A-Za-z0-9]){2,}\.?` pattern in one shot). The
        // trailing dot of the acronym also survives. This is the
        // documented (and tested below in `step_normalize_preserves_dot_acronyms`)
        // behavior; pinning it explicitly here so any change shows up
        // as a clear cross-step regression rather than as a mysterious
        // failure in a single sub-step test.
        let expected = "Show - Sub - Detail Part 2.S.H.I.E.L.D. - End";
        assert_eq!(
            clean_title_preserve_dashes(input),
            expected,
            "composition order regression: each step must run on the \
             output of the previous one in the documented sequence"
        );
    }

    #[test]
    fn step_normalize_preserves_dot_acronyms() {
        let out = normalize_separators("Agents.of.S.H.I.E.L.D.S01", DashPolicy::WordDashOnly);
        assert!(out.contains("S.H.I.E.L.D"), "got: {out}");
    }

    #[test]
    fn step_trim_trailing_punct() {
        assert_eq!(trim_trailing_punct("Title -"), "Title");
        assert_eq!(trim_trailing_punct("Title:,;"), "Title");
        assert_eq!(trim_trailing_punct("Title"), "Title");
    }

    #[test]
    fn step_strip_trailing_keywords() {
        // The Part / Season / Episode regexes start with `\s+` so they
        // consume the space before the keyword. The bonus regex starts
        // with `[-]` so it does NOT eat the leading space — the trailing
        // space remains in the result. This matches pre-refactor behavior
        // exactly; trimming is the caller's job.
        assert_eq!(strip_trailing_keywords("Show Part 2"), "Show");
        assert_eq!(strip_trailing_keywords("Show Season 3"), "Show");
        assert_eq!(strip_trailing_keywords("Show Episode"), "Show");
        assert_eq!(strip_trailing_keywords("Show -x05"), "Show ");
        // Empty fallback: don't strip if the result would be empty.
        assert_eq!(strip_trailing_keywords("Part 2"), "Part 2");
    }

    #[test]
    fn episode_title_keeps_part_n() {
        // clean_episode_title must NOT strip trailing "Part N" — that's
        // valid episode-title content.
        assert_eq!(
            clean_episode_title("The Battle Part 2"),
            "The Battle Part 2"
        );
    }

    #[test]
    fn episode_title_trims_leading_seps() {
        assert_eq!(clean_episode_title(" - The Battle"), "The Battle");
        assert_eq!(clean_episode_title(".._The Battle"), "The Battle");
    }

    // ── is_generic_dir ──────────────────────────────────────────────

    #[test]
    fn generic_dir_originals() {
        // Original entries still work.
        assert!(is_generic_dir("Movies"));
        assert!(is_generic_dir("tv"));
        assert!(is_generic_dir("Season 1"));
        assert!(is_generic_dir("Saison 03"));
    }

    #[test]
    fn generic_dir_extras_and_bonus() {
        assert!(is_generic_dir("Extras"));
        assert!(is_generic_dir("Specials"));
        assert!(is_generic_dir("Bonus"));
        assert!(is_generic_dir("Featurettes"));
        assert!(is_generic_dir("Behind The Scenes"));
        assert!(is_generic_dir("Deleted Scenes"));
        assert!(is_generic_dir("Trailers"));
        assert!(is_generic_dir("Sample"));
    }

    #[test]
    fn generic_dir_disc_and_cd() {
        assert!(is_generic_dir("Disc 1"));
        assert!(is_generic_dir("Disc2"));
        assert!(is_generic_dir("Disk 3"));
        assert!(is_generic_dir("DVD1"));
        assert!(is_generic_dir("CD1"));
        assert!(is_generic_dir("CD2"));
        assert!(!is_generic_dir("CD123")); // too long for CD pattern
    }

    #[test]
    fn generic_dir_quality() {
        assert!(is_generic_dir("1080p"));
        assert!(is_generic_dir("720p"));
        assert!(is_generic_dir("2160p"));
        assert!(is_generic_dir("4K"));
    }

    // ── #146 closer: kill the last 2 surviving mutants ────────────────
    //
    // The 2026-04-19 nightly surfaced two single-mutant clusters in
    // this file that no test pinned. These tests close them out and
    // complete the #173 triage roadmap.

    #[test]
    fn generic_dir_recognizes_all_season_prefix_synonyms() {
        // Pin `|| -> &&` mutants on the prefix-match chain at
        // is_generic_dir lines 514-519. Each `lower.starts_with(...)`
        // OR-arm must be exercised by at least one assertion: with
        // `|| -> &&` on any single arm, the chain becomes a giant AND
        // that returns false for any single-prefix input.
        //
        // Existing tests covered "Season" / "Saison" / "Disc" / "Disk".
        // Missing coverage: "Temporada" (PT), "Stagione" (IT), "DVD".
        // Adding these kills the surviving line-516 mutant and pins
        // every remaining || in the chain for free.
        assert!(
            is_generic_dir("Temporada 2"),
            "Portuguese 'Temporada' (Season) prefix"
        );
        assert!(
            is_generic_dir("Stagione 1"),
            "Italian 'Stagione' (Season) prefix"
        );
        assert!(is_generic_dir("DVD9"), "DVD prefix (e.g., DVD5, DVD9)");
        assert!(is_generic_dir("dvdrip"), "DVD prefix is case-insensitive");
    }

    #[test]
    fn classify_dash_word_dash_when_both_flanks_alphanumeric() {
        // Happy path: "Spider-Man" — alnum on both sides → WordDash.
        let chars: Vec<char> = "Spider-Man".chars().collect();
        let dash_idx = chars.iter().position(|&c| c == '-').unwrap();
        assert_eq!(classify_dash(&chars, dash_idx), DashKind::WordDash);
    }

    #[test]
    fn classify_dash_separator_flanked_when_both_sides_are_separators() {
        // Pin the SeparatorFlanked branch: space-dash-space.
        // Required to confirm the branch is reachable before pinning the
        // && -> || mutant in the next test.
        let chars: Vec<char> = "Show - Title".chars().collect();
        let dash_idx = chars.iter().position(|&c| c == '-').unwrap();
        assert_eq!(classify_dash(&chars, dash_idx), DashKind::SeparatorFlanked);
    }

    #[test]
    fn classify_dash_other_when_only_one_flank_is_separator() {
        // Pin `&& -> ||` mutant on `is_sep(prev) && is_sep(next)`.
        //
        // Asymmetric flanks: separator on ONE side, non-alnum non-sep on
        // the other. With the original `&&`, both must be separators →
        // returns Other (correct). With the mutant `||`, EITHER being a
        // separator suffices → returns SeparatorFlanked (BUG).
        //
        // "Foo -[Bar" — the dash has a space before (separator) but '[// after, which is neither alnum nor a SEPS member. Both alnum
        // checks fail, so the alnum branch doesn't fire. Then the sep
        // check: prev=' ' is sep, next='[' is NOT a sep → the original
        // returns Other; the mutant would return SeparatorFlanked.
        let chars: Vec<char> = "Foo -[Bar".chars().collect();
        let dash_idx = chars.iter().position(|&c| c == '-').unwrap();
        assert_eq!(classify_dash(&chars, dash_idx), DashKind::Other);

        // Mirror case: '[' before, separator after.
        let chars: Vec<char> = "[- Bar".chars().collect();
        let dash_idx = chars.iter().position(|&c| c == '-').unwrap();
        assert_eq!(classify_dash(&chars, dash_idx), DashKind::Other);
    }

    #[test]
    fn classify_dash_at_boundaries() {
        // Belt: dash at index 0 (no prev) and at last index (no next).
        // Pins the `i > 0` boundary check at the top of classify_dash.
        let chars: Vec<char> = "-Foo".chars().collect();
        // prev=None, next='F' (alnum). is_alnum(None)=false, so the
        // alnum branch is false; is_sep(None)=false, so sep branch false
        // → Other.
        assert_eq!(classify_dash(&chars, 0), DashKind::Other);

        let chars: Vec<char> = "Foo-".chars().collect();
        let last = chars.len() - 1;
        // prev='o' (alnum), next=None. alnum branch needs both → false;
        // sep branch needs both → false → Other.
        assert_eq!(classify_dash(&chars, last), DashKind::Other);
    }

    #[test]
    fn generic_dir_subtitles_and_audio() {
        assert!(is_generic_dir("Subs"));
        assert!(is_generic_dir("Subtitles"));
        assert!(is_generic_dir("OST"));
        assert!(is_generic_dir("Soundtrack"));
    }

    #[test]
    fn generic_dir_structural() {
        assert!(is_generic_dir("Anime"));
        assert!(is_generic_dir("Kids"));
        assert!(is_generic_dir("Cartoons"));
        assert!(is_generic_dir("Shows"));
        assert!(is_generic_dir("Documentary"));
        assert!(is_generic_dir("Documentaries"));
        assert!(is_generic_dir("Music"));
        assert!(is_generic_dir("Concert"));
        assert!(is_generic_dir("Concerts"));
    }

    #[test]
    fn generic_dir_language_categories() {
        assert!(is_generic_dir("Chinese"));
        assert!(is_generic_dir("English"));
        assert!(is_generic_dir("Japanese"));
        assert!(is_generic_dir("Korean"));
        assert!(is_generic_dir("French"));
        assert!(is_generic_dir("German"));
        assert!(is_generic_dir("Spanish"));
        assert!(is_generic_dir("Italian"));
        assert!(is_generic_dir("Portuguese"));
        assert!(is_generic_dir("Russian"));
        assert!(is_generic_dir("Thai"));
        assert!(is_generic_dir("Hindi"));
        assert!(is_generic_dir("Arabic"));
    }

    #[test]
    fn generic_dir_cjk_bonus() {
        assert!(is_generic_dir("特典映像"));
        assert!(is_generic_dir("特典"));
        assert!(is_generic_dir("映像特典"));
        assert!(is_generic_dir("SP"));
    }

    #[test]
    fn non_generic_dirs() {
        // Real titles should NOT be generic.
        assert!(!is_generic_dir("Paw Patrol"));
        assert!(!is_generic_dir("Transformers 1984"));
        assert!(!is_generic_dir("Breaking Bad"));
        assert!(!is_generic_dir("十二国記"));
    }

    // ── casing_score: pin every branch's exact return value ────────
    //
    // Designed against the surviving mutants reported in the first
    // mutation nightly (run 24615983143). Three function-stub mutants
    // (return 0, return 1, return -1) survived because no test pinned
    // the exact score — only the downstream comparison was observed.
    // These tests assert the precise integer to slam that door shut.
    // See docs/src/contributor-guide/mutation-baseline.md for the full triage write-up.

    #[test]
    fn casing_score_all_uppercase_returns_minus_ten() {
        assert_eq!(casing_score("THE MATRIX"), -10);
        assert_eq!(casing_score("AVENGERS"), -10);
        // Single all-upper letter: still all-uppercase.
        assert_eq!(casing_score("X"), -10);
    }

    #[test]
    fn casing_score_all_lowercase_returns_minus_five() {
        assert_eq!(casing_score("the matrix"), -5);
        assert_eq!(casing_score("avengers"), -5);
        assert_eq!(casing_score("x"), -5);
    }

    #[test]
    fn casing_score_title_case_counts_capitalized_words() {
        assert_eq!(casing_score("The Matrix"), 2);
        assert_eq!(casing_score("Star Wars Episode IV"), 4);
        // Single capitalized word.
        assert_eq!(casing_score("Matrix"), 1);
    }

    #[test]
    fn casing_score_mixed_case_only_caps_starts_count() {
        // "the Matrix" → 1 (only "Matrix" starts uppercase)
        assert_eq!(casing_score("the Matrix"), 1);
        // "The matrix Reloaded" → 2 ("The" and "Reloaded")
        assert_eq!(casing_score("The matrix Reloaded"), 2);
    }

    #[test]
    fn casing_score_no_alphabetic_treats_as_all_upper() {
        // Documented edge case: vacuous truth on the empty alphabetic
        // filter means an all-digit string short-circuits to -10.
        // Pinning this so the contract survives future refactors.
        assert_eq!(casing_score(""), -10);
        assert_eq!(casing_score("123"), -10);
        assert_eq!(casing_score("   "), -10);
    }

    // ── pick_better_casing: covers the >= boundary mutation ─────────
    //
    // The fourth surviving mutant from #146 was at the `>=` comparison
    // (line :388 in the pre-hoist version). The tie test below pins
    // left-bias on equal scores; if `>=` is mutated to `>`, ties would
    // swap to `b` and the test fails. The strict-inequality cases also
    // catch other comparator mutations (`<`, `<=`, `==`, `!=`).

    #[test]
    fn pick_better_casing_picks_higher_score() {
        // a > b: "The Matrix" (2) beats "the matrix" (-5)
        assert_eq!(pick_better_casing("The Matrix", "the matrix"), "The Matrix");
        // b > a: "the matrix" (-5) loses to "The Matrix" (2)
        assert_eq!(pick_better_casing("the matrix", "The Matrix"), "The Matrix");
        // SHOUTING (-10) loses to anything mixed-case.
        assert_eq!(pick_better_casing("THE MATRIX", "The Matrix"), "The Matrix");
        // SHOUTING (-10) loses to lowercase (-5) too.
        assert_eq!(pick_better_casing("THE MATRIX", "the matrix"), "the matrix");
    }

    #[test]
    fn pick_better_casing_tie_returns_left() {
        // Both score 2 ("Title Case" two-word strings). The `>=` makes
        // ties go to `a`. Mutating `>=` to `>` would flip this to `b`.
        assert_eq!(pick_better_casing("The Matrix", "Star Wars"), "The Matrix");
        assert_eq!(pick_better_casing("Star Wars", "The Matrix"), "Star Wars");
        // Both score -5 (all-lowercase): also tie → left.
        assert_eq!(pick_better_casing("the matrix", "star wars"), "the matrix");
        // Both score -10 (all-uppercase): also tie → left.
        assert_eq!(pick_better_casing("THE MATRIX", "STAR WARS"), "THE MATRIX");
        // Identical inputs: trivially tie → left.
        assert_eq!(pick_better_casing("Same", "Same"), "Same");
    }

    // ── strip_extension boundary tests ────────────────────────
    //
    // Five mutants survived in strip_extension as of the 2026-04-19
    // nightly (#146). Each test below is named for the specific
    // mutation it kills. The function is small (8 lines) but
    // semantically dense — every operator and condition matters.

    #[test]
    fn strip_extension_no_dot_returns_input_unchanged() {
        // Pins the function-stub mutant `replace strip_extension -> &str
        // with ""`. With the mutation, this would return "" instead of
        // "NoExtensionHere", which is plainly wrong.
        assert_eq!(strip_extension("NoExtensionHere"), "NoExtensionHere");
    }

    #[test]
    fn strip_extension_known_extension_strips_dot_and_ext() {
        // Pins the function-stub mutant for the happy path — confirms
        // the function returns the actual prefix, not "".
        assert_eq!(strip_extension("The.Matrix.mkv"), "The.Matrix");
        assert_eq!(strip_extension("movie.mp4"), "movie");
    }

    #[test]
    fn strip_extension_dot_plus_one_indexing_is_correct() {
        // Pins `+ -> -` and `+ -> *` in `dot + 1..`.
        //
        // For "foo.mkv" (dot at index 3):
        //   - dot + 1 = 4 → ext = "mkv" (correct, is_likely_extension=true)
        //   - dot - 1 = 2 → ext = "o.mkv" (5 chars, but not a known
        //     extension → returns whole input unchanged)
        //   - dot * 1 = 3 → ext = ".mkv" (4 chars, not a known extension
        //     because of the leading dot → returns whole input unchanged)
        //
        // Either mutation produces "foo.mkv" instead of "foo".
        assert_eq!(strip_extension("foo.mkv"), "foo");
    }

    #[test]
    fn strip_extension_unknown_short_extension_keeps_input() {
        // Pins `&& -> ||` in `ext.len() <= 5 && is_likely_extension(...)`.
        //
        // "foo.xyzab" has a 5-char extension that satisfies len <= 5
        // but is_likely_extension("xyzab") returns false.
        //   - With `&&`: false → return whole input "foo.xyzab"
        //   - With `||`: true (length OK) → strip → "foo"  (BUG)
        //
        // Asserting the input survives kills the `||` mutation.
        assert_eq!(strip_extension("foo.xyzab"), "foo.xyzab");
    }

    #[test]
    fn strip_extension_long_known_lookalike_keeps_input() {
        // Belt-and-suspenders for `<= -> >`. While none of our recognized
        // extensions happen to be exactly 5 chars, this test pins the
        // length gate against "too long to be plausible":
        //
        // "sample.notarealextension" — ext is 17 chars.
        //   - With `<=`: 17 <= 5 false → return whole input (correct)
        //   - With `>`:  17 > 5 true → fall to is_likely_extension
        //     (returns false for "notarealextension") → still returns
        //     whole input. Equivalent for this case alone.
        //
        // The kill for `<= -> >` actually comes from the test below.
        assert_eq!(
            strip_extension("sample.notarealextension"),
            "sample.notarealextension"
        );
    }

    #[test]
    fn strip_extension_known_three_char_extension_pins_le_boundary() {
        // Pins `<= -> >` in `ext.len() <= 5`.
        //
        // "clip.mkv" — ext is 3 chars, is_likely_extension("mkv")=true.
        //   - With `<=`: 3 <= 5 true → AND with is_likely=true → strip → "clip"
        //   - With `>`:  3 > 5 false → return whole input "clip.mkv" (BUG)
        //
        // Asserting the strip happens kills `<= -> >` (and reinforces
        // the function-stub mutant kill from above).
        assert_eq!(strip_extension("clip.mkv"), "clip");
        // Also exercise a 4-char known extension ("webm"):
        assert_eq!(strip_extension("video.webm"), "video");
    }

    #[test]
    fn strip_extension_case_insensitive_match() {
        // Documented behaviour: extension matching uses to_lowercase.
        // Belt for the `is_likely_extension(&ext_lower)` call site —
        // confirms the lowercasing is in the loop, not skipped.
        assert_eq!(strip_extension("Movie.MKV"), "Movie");
        assert_eq!(strip_extension("Trailer.Mp4"), "Trailer");
    }

    // ── normalize_separators helper boundary tests (#146) ───────────────
    //
    // Three mutants survived in normalize_separators on lines 154 + 164
    // as of the 2026-04-19 nightly. Both predicates are now hoisted to
    // free functions; the tests below pin every operator and boundary.

    #[test]
    fn acronym_match_starts_at_separator_at_position_zero_returns_false() {
        // Pin `> -> >=` mutant on `match_start > 0`.
        // At position 0 there is no preceding byte to inspect, so the
        // function MUST short-circuit to false (not panic).
        //   - With `>`:  0 > 0 is false (correct, returns false)
        //   - With `>=`: 0 >= 0 is true → dereferences input.as_bytes()[0]
        //     which for "S.H.I.E.L.D" is b'S' (not a separator), so it
        //     would still return false here. So this test alone DOES NOT
        //     kill `> -> >=`. The next test below uses an input where the
        //     position-0 byte IS a separator to force the kill.
        assert!(!acronym_match_starts_at_separator("S.H.I.E.L.D", 0));
    }

    #[test]
    fn acronym_match_starts_at_separator_position_zero_with_separator_byte() {
        // Pin `> -> >=` mutant strongly: at position 0 with a separator
        // byte at index 0, the original `> 0` short-circuits to false,
        // but the mutant `>= 0` would proceed to inspect the byte and
        // see a separator, returning true.
        //
        // Inputs where byte 0 is a separator: " foo", ".foo", "_foo".
        //   - With `>`:  0 > 0 false → false (correct: nothing to skip
        //     before position 0 even if byte 0 is a separator).
        //   - With `>=`: 0 >= 0 true AND b' ' matches → true (BUG).
        assert!(!acronym_match_starts_at_separator(" foo", 0));
        assert!(!acronym_match_starts_at_separator(".foo", 0));
        assert!(!acronym_match_starts_at_separator("_foo", 0));
    }

    #[test]
    fn acronym_match_starts_at_separator_with_each_separator_byte() {
        // Pin `&& -> ||` mutant on the `match_start > 0 && matches!(...)`.
        //   - With `&&`: both must be true. At position 1 with a non-sep
        //     byte at index 1, both branches: pos>0=true, byte_is_sep=false
        //     → false (correct).
        //   - With `||`: either is enough. pos>0=true alone returns true
        //     even if byte is NOT a separator (BUG).
        //
        // Test 1: position > 0 with NON-separator byte → must be false.
        assert!(!acronym_match_starts_at_separator("abcd", 2));

        // Test 2: position > 0 with each of the four separator bytes → true.
        assert!(acronym_match_starts_at_separator("a foo", 1)); // space
        assert!(acronym_match_starts_at_separator("a\tfoo", 1)); // tab
        assert!(acronym_match_starts_at_separator("a.foo", 1)); // dot
        assert!(acronym_match_starts_at_separator("a_foo", 1)); // underscore
    }

    #[test]
    fn position_in_any_range_empty_list_returns_false() {
        // Function-stub-ish: empty .any() must return false.
        assert!(!position_in_any_range(0, &[]));
        assert!(!position_in_any_range(100, &[]));
    }

    #[test]
    fn position_in_any_range_pins_lower_bound_inclusive() {
        // Pin `>= -> <` and `>= -> >` mutants on `pos >= *s`.
        //
        // Range is [10, 20). pos=10 is the inclusive lower bound.
        //   - With `>=`: 10 >= 10 true → inside (correct)
        //   - With `>`:  10 > 10 false → outside (BUG)
        //   - With `<`:  10 < 10 false → outside (BUG)
        assert!(position_in_any_range(10, &[(10, 20)]));
    }

    #[test]
    fn position_in_any_range_pins_upper_bound_exclusive() {
        // Pin `< -> ==`, `< -> >`, `< -> <=` mutants on `pos < *e`.
        //
        // Range is [10, 20). pos=20 is the EXCLUSIVE upper bound.
        //   - With `<`:  20 < 20 false → outside (correct)
        //   - With `<=`: 20 <= 20 true → inside (BUG)
        assert!(!position_in_any_range(20, &[(10, 20)]));

        // pos=19 is the last position INSIDE the range.
        //   - With `<`:  19 < 20 true → inside (correct)
        //   - With `>`:  19 > 20 false → outside (BUG)
        //   - With `==`: 19 == 20 false → outside (BUG)
        assert!(position_in_any_range(19, &[(10, 20)]));
    }

    #[test]
    fn position_in_any_range_pins_and_to_or_with_disjoint_pos() {
        // Pin `&& -> ||` mutant on `pos >= *s && pos < *e`.
        //
        // pos=5, range=[10, 20):
        //   - pos >= 10 is false; pos < 20 is true.
        //   - With `&&`: false && true → false → outside (correct).
        //   - With `||`: false || true → true → inside (BUG).
        assert!(!position_in_any_range(5, &[(10, 20)]));

        // pos=25, range=[10, 20):
        //   - pos >= 10 is true; pos < 20 is false.
        //   - With `&&`: true && false → false → outside (correct).
        //   - With `||`: true || false → true → inside (BUG).
        assert!(!position_in_any_range(25, &[(10, 20)]));
    }

    #[test]
    fn position_in_any_range_finds_match_in_second_range() {
        // Belt: confirms .any() actually iterates past non-matching ranges.
        let ranges = [(0, 5), (10, 20), (30, 40)];
        assert!(position_in_any_range(15, &ranges));
        assert!(position_in_any_range(35, &ranges));
        assert!(!position_in_any_range(7, &ranges));
        assert!(!position_in_any_range(25, &ranges));
    }
}