Skip to main content

config_disassembler/xml/
cli.rs

1//! Command-line interface for the xml-disassembler binary.
2//!
3//! Kept in the library crate so it can be exercised by unit tests and
4//! the binary stays a thin shim.
5
6use crate::xml::{
7    DecomposeRule, DisassembleXmlFileHandler, MultiLevelRule, ReassembleXmlFileHandler, SidecarSpec,
8};
9
10/// Options parsed from disassemble CLI args.
11pub struct DisassembleOpts<'a> {
12    pub path: Option<&'a str>,
13    pub unique_id_elements: Option<&'a str>,
14    pub pre_purge: bool,
15    pub post_purge: bool,
16    /// Explicit `--ignore-path` value. `None` means the caller did not
17    /// pass the flag and the runner should resolve a default (see
18    /// [`crate::xml::ignore_file::resolve_xml_ignore_path`]).
19    ///
20    /// [`crate::xml::ignore_file::resolve_xml_ignore_path`]: crate::ignore_file::resolve_xml_ignore_path
21    pub ignore_path: Option<&'a str>,
22    pub format: &'a str,
23    pub strategy: Option<&'a str>,
24    pub multi_level: Option<String>,
25    pub split_tags: Option<String>,
26    /// Comma-separated `element:extension` pairs, e.g. `"schema:yaml"`.
27    pub sidecar_elements: Option<String>,
28}
29
30/// Parse --split-tags spec for grouped-by-tag. Comma-separated rules; each rule:
31/// `tag:mode:field` (path_segment defaults to tag) or `tag:path:mode:field`.
32/// mode = "split" (one file per item) or "group" (group by field).
33pub fn parse_decompose_spec(spec: &str) -> Vec<DecomposeRule> {
34    let mut rules = Vec::new();
35    for part in spec.split(',') {
36        let part = part.trim();
37        let segments: Vec<&str> = part.splitn(4, ':').collect();
38        if segments.len() >= 3 {
39            let tag = segments[0].to_string();
40            let (path_segment, mode, field) = if segments.len() == 3 {
41                (
42                    tag.clone(),
43                    segments[1].to_string(),
44                    segments[2].to_string(),
45                )
46            } else {
47                (
48                    segments[1].to_string(),
49                    segments[2].to_string(),
50                    segments[3].to_string(),
51                )
52            };
53            if !tag.is_empty() && !mode.is_empty() && !field.is_empty() {
54                rules.push(DecomposeRule {
55                    tag,
56                    path_segment,
57                    mode,
58                    field,
59                });
60            }
61        }
62    }
63    rules
64}
65
66/// Parse a single --multi-level spec: `file_pattern:root_to_strip:unique_id_elements`.
67pub fn parse_multi_level_spec(spec: &str) -> Option<MultiLevelRule> {
68    let parts: Vec<&str> = spec.splitn(3, ':').collect();
69    if parts.len() != 3 {
70        return None;
71    }
72    let (file_pattern, root_to_strip, unique_id_elements) = (parts[0], parts[1], parts[2]);
73    if file_pattern.is_empty() || root_to_strip.is_empty() || unique_id_elements.is_empty() {
74        return None;
75    }
76    let path_segment = crate::xml::path_segment_from_file_pattern(file_pattern);
77    Some(MultiLevelRule {
78        file_pattern: file_pattern.to_string(),
79        root_to_strip: root_to_strip.to_string(),
80        unique_id_elements: unique_id_elements.to_string(),
81        path_segment: path_segment.clone(),
82        wrap_root_element: root_to_strip.to_string(),
83        wrap_xmlns: String::new(),
84    })
85}
86
87/// Parse one or more --multi-level specs separated by `;`.
88///
89/// Each rule is `file_pattern:root_to_strip:unique_id_elements`; rules are joined by `;`
90/// because the third part is itself a comma-separated list. Empty rules (e.g. trailing `;`)
91/// are skipped silently. Malformed rules are dropped (the caller may warn separately if it
92/// needs to surface that to the user).
93pub fn parse_multi_level_specs(spec: &str) -> Vec<MultiLevelRule> {
94    spec.split(';')
95        .map(str::trim)
96        .filter(|s| !s.is_empty())
97        .filter_map(parse_multi_level_spec)
98        .collect()
99}
100
101/// Parse disassemble args: `<path> [options]`.
102///
103/// Iteration is driven by `args.iter()` rather than a manual `let mut i =
104/// 0; while i < args.len()` cursor so that every option handler advances
105/// the cursor by consuming the iterator. The previous index-based loop
106/// scattered ~22 `i += 1` expressions across the body; every `+= -> -=`
107/// or `+= -> *=` mutation on those lines produces an infinite loop (the
108/// outer `while` never terminates because `i` either wraps around on
109/// usize underflow or stays put), which `cargo-mutants` can only
110/// classify as `timeout`. That added ~36 timeouts and ~36 minutes of
111/// wall-clock to every full sweep with no actual signal. The iterator
112/// form removes those mutation sites entirely; behavior is unchanged
113/// and covered by the existing `parse_disassemble_args_*` tests.
114pub fn parse_disassemble_args(args: &[String]) -> DisassembleOpts<'_> {
115    let mut path = None;
116    let mut unique_id_elements = None;
117    let mut pre_purge = false;
118    let mut post_purge = false;
119    let mut ignore_path: Option<&str> = None;
120    let mut format = "xml";
121    let mut strategy = None;
122    let mut multi_level = None;
123    let mut split_tags = None;
124    let mut sidecar_elements = None;
125
126    let mut iter = args.iter();
127    while let Some(arg) = iter.next() {
128        if arg == "--postpurge" {
129            post_purge = true;
130        } else if arg == "--prepurge" {
131            pre_purge = true;
132        } else if let Some(rest) = arg.strip_prefix("--unique-id-elements=") {
133            unique_id_elements = Some(rest);
134        } else if arg == "--unique-id-elements" {
135            if let Some(value) = iter.next() {
136                unique_id_elements = Some(value.as_str());
137            }
138        } else if let Some(rest) = arg.strip_prefix("--ignore-path=") {
139            ignore_path = Some(rest);
140        } else if arg == "--ignore-path" {
141            if let Some(value) = iter.next() {
142                ignore_path = Some(value.as_str());
143            }
144        } else if let Some(rest) = arg.strip_prefix("--format=") {
145            format = rest;
146        } else if arg == "--format" {
147            if let Some(value) = iter.next() {
148                format = value.as_str();
149            }
150        } else if let Some(rest) = arg.strip_prefix("--strategy=") {
151            strategy = Some(rest);
152        } else if arg == "--strategy" {
153            if let Some(value) = iter.next() {
154                strategy = Some(value.as_str());
155            }
156        } else if let Some(rest) = arg.strip_prefix("--multi-level=") {
157            multi_level = Some(rest.to_string());
158        } else if arg == "--multi-level" {
159            if let Some(value) = iter.next() {
160                multi_level = Some(value.clone());
161            }
162        } else if let Some(rest) = arg.strip_prefix("--split-tags=") {
163            split_tags = Some(rest.to_string());
164        } else if arg == "--split-tags" || arg == "-p" {
165            if let Some(value) = iter.next() {
166                split_tags = Some(value.clone());
167            }
168        } else if let Some(rest) = arg.strip_prefix("--sidecar-elements=") {
169            sidecar_elements = Some(rest.to_string());
170        } else if arg == "--sidecar-elements" {
171            if let Some(value) = iter.next() {
172                sidecar_elements = Some(value.clone());
173            }
174        } else if arg.starts_with("--") {
175            // Unknown long flag: silently skipped (matches the legacy
176            // index-based parser, whose tests pin this behavior via
177            // `parse_disassemble_args_unknown_long_flag_is_skipped`).
178        } else if path.is_none() {
179            path = Some(arg.as_str());
180        }
181        // Else: extra positional argument, dropped silently to match the
182        // legacy parser (covered by
183        // `parse_disassemble_args_trailing_extra_positional_ignored`).
184    }
185
186    DisassembleOpts {
187        path,
188        unique_id_elements,
189        pre_purge,
190        post_purge,
191        ignore_path,
192        format,
193        strategy,
194        multi_level,
195        split_tags,
196        sidecar_elements,
197    }
198}
199
200/// Parse reassemble args: `<path> [extension] [--postpurge]`.
201pub fn parse_reassemble_args(args: &[String]) -> (Option<&str>, Option<&str>, bool) {
202    let mut path = None;
203    let mut extension = None;
204    let mut post_purge = false;
205    for arg in args.iter() {
206        if arg == "--postpurge" {
207            post_purge = true;
208        } else if path.is_none() {
209            path = Some(arg.as_str());
210        } else if extension.is_none() {
211            extension = Some(arg.as_str());
212        }
213    }
214    (path, extension, post_purge)
215}
216
217/// Parse a `--sidecar-elements` spec string into a list of [`SidecarSpec`]s.
218///
219/// Input format: comma-separated `element:extension` pairs, e.g.
220/// `"schema:yaml"` or `"schema:yaml,wsdl:wsdl"`. Malformed pairs (missing
221/// colon, empty element or extension) are silently dropped.
222pub fn parse_sidecar_specs(spec: &str) -> Vec<SidecarSpec> {
223    spec.split(',')
224        .map(str::trim)
225        .filter_map(|pair| {
226            let (element, extension) = pair.split_once(':')?;
227            let element = element.trim().to_string();
228            let extension = extension.trim().to_string();
229            if element.is_empty() || extension.is_empty() {
230                return None;
231            }
232            Some(SidecarSpec {
233                element,
234                extension,
235                original_format: None,
236            })
237        })
238        .collect()
239}
240
241/// Print CLI usage to stderr.
242pub fn print_usage() {
243    eprintln!("Usage: xml-disassembler <command> [options]");
244    eprintln!("  disassemble <path> [options]     - Disassemble XML file or directory");
245    eprintln!("    --postpurge                    - Delete original file/dir after disassembling (default: false)");
246    eprintln!("    --prepurge                     - Remove existing disassembly output before running (default: false)");
247    eprintln!(
248        "    --unique-id-elements <list>    - Comma-separated element names for nested filenames"
249    );
250    eprintln!("    --ignore-path <path>           - Path to ignore file (default: .cdignore; falls back to .xmldisassemblerignore for backward compatibility)");
251    eprintln!(
252        "    --format <fmt>                 - Output format: xml, json, json5, yaml (default: xml)"
253    );
254    eprintln!(
255        "    --strategy <name>              - unique-id or grouped-by-tag (default: unique-id)"
256    );
257    eprintln!("    --multi-level <spec>          - Further disassemble matching files: file_pattern:root_to_strip:unique_id_elements (multiple rules separated by ';')");
258    eprintln!("    -p, --split-tags <spec>       - With grouped-by-tag: split/group nested tags (e.g. objectPermissions:split:object,fieldPermissions:group:field)");
259    eprintln!("    --sidecar-elements <spec>     - Extract element text to companion files: element:extension (comma-separated, e.g. schema:yaml)");
260    eprintln!("  reassemble <path> [extension] [--postpurge]  - Reassemble directory (default extension: xml); sidecar specs are auto-detected from .sidecars.json");
261}
262
263/// True when `args` only contains the program name (or is empty).
264/// Pure helper extracted from `run` so the `args.len() < 2` guard
265/// can be exercised at every boundary without spawning a process.
266fn should_print_usage(args_len: usize) -> bool {
267    args_len < 2
268}
269
270/// True when the user supplied a `--multi-level` spec that didn't
271/// parse into any rules. Pure helper extracted from `run_disassemble`
272/// so both legs of `spec.is_some() && parsed.is_empty()` are testable.
273fn multi_level_spec_failed_to_parse(spec_present: bool, parsed_empty: bool) -> bool {
274    spec_present && parsed_empty
275}
276
277/// True when the strategy is `grouped-by-tag` and decompose-spec
278/// parsing should run. Extracting this guard avoids paying the cost
279/// of parsing `--split-tags` (and triggering its destructive
280/// behaviours under mutation testing) for any other strategy.
281fn should_parse_decompose_rules(strategy: &str) -> bool {
282    strategy == "grouped-by-tag"
283}
284
285/// Run the CLI with the given args. `args[0]` is expected to be the program name.
286pub async fn run(args: Vec<String>) -> Result<(), Box<dyn std::error::Error + Send + Sync>> {
287    if should_print_usage(args.len()) {
288        print_usage();
289        return Ok(());
290    }
291
292    let command = &args[1];
293    match command.as_str() {
294        "disassemble" => run_disassemble(&args[2..]).await?,
295        "reassemble" => run_reassemble(&args[2..]).await?,
296        _ => {
297            eprintln!("Unknown command: {}", command);
298        }
299    }
300
301    Ok(())
302}
303
304async fn run_disassemble(args: &[String]) -> Result<(), Box<dyn std::error::Error + Send + Sync>> {
305    let opts = parse_disassemble_args(args);
306    let path = opts.path.unwrap_or(".");
307    let strategy = opts.strategy.unwrap_or("unique-id");
308    let multi_level_rules: Vec<MultiLevelRule> = opts
309        .multi_level
310        .as_deref()
311        .map(parse_multi_level_specs)
312        .unwrap_or_default();
313    if multi_level_spec_failed_to_parse(opts.multi_level.is_some(), multi_level_rules.is_empty()) {
314        eprintln!("Invalid --multi-level spec; use file_pattern:root_to_strip:unique_id_elements (multiple rules separated by ';')");
315    }
316    let decompose_rules: Vec<DecomposeRule> = if should_parse_decompose_rules(strategy) {
317        opts.split_tags
318            .as_ref()
319            .map(|s| parse_decompose_spec(s))
320            .unwrap_or_default()
321    } else {
322        Vec::new()
323    };
324    let decompose_rules_ref = if decompose_rules.is_empty() {
325        None
326    } else {
327        Some(decompose_rules.as_slice())
328    };
329    let cwd = std::env::current_dir().unwrap_or_else(|_| std::path::Path::new(".").to_path_buf());
330    let resolved_ignore = crate::ignore_file::resolve_xml_ignore_path(opts.ignore_path, &cwd);
331    let multi_level_rules_ref = if multi_level_rules.is_empty() {
332        None
333    } else {
334        Some(multi_level_rules.as_slice())
335    };
336    let sidecar_specs: Vec<SidecarSpec> = opts
337        .sidecar_elements
338        .as_deref()
339        .map(parse_sidecar_specs)
340        .unwrap_or_default();
341    let sidecar_specs_ref = if sidecar_specs.is_empty() {
342        None
343    } else {
344        Some(sidecar_specs.as_slice())
345    };
346    let mut handler = DisassembleXmlFileHandler::new();
347    handler
348        .disassemble(
349            path,
350            opts.unique_id_elements,
351            Some(strategy),
352            opts.pre_purge,
353            opts.post_purge,
354            &resolved_ignore,
355            opts.format,
356            multi_level_rules_ref,
357            decompose_rules_ref,
358            sidecar_specs_ref,
359        )
360        .await?;
361    Ok(())
362}
363
364async fn run_reassemble(args: &[String]) -> Result<(), Box<dyn std::error::Error + Send + Sync>> {
365    let (path, extension, post_purge) = parse_reassemble_args(args);
366    let path = path.unwrap_or(".");
367    let handler = ReassembleXmlFileHandler::new();
368    handler
369        .reassemble(path, extension.or(Some("xml")), post_purge, None)
370        .await?;
371    Ok(())
372}
373
374#[cfg(test)]
375mod tests {
376    use super::*;
377
378    fn sv(s: &str) -> String {
379        s.to_string()
380    }
381
382    #[test]
383    fn parse_decompose_spec_three_segments_defaults_path_segment_to_tag() {
384        let rules = parse_decompose_spec("objectPermissions:split:object");
385        assert_eq!(rules.len(), 1);
386        let r = &rules[0];
387        assert_eq!(r.tag, "objectPermissions");
388        assert_eq!(r.path_segment, "objectPermissions");
389        assert_eq!(r.mode, "split");
390        assert_eq!(r.field, "object");
391    }
392
393    #[test]
394    fn parse_decompose_spec_four_segments_uses_explicit_path_segment() {
395        let rules = parse_decompose_spec("fieldPermissions:fieldPerms:group:field");
396        assert_eq!(rules.len(), 1);
397        let r = &rules[0];
398        assert_eq!(r.tag, "fieldPermissions");
399        assert_eq!(r.path_segment, "fieldPerms");
400        assert_eq!(r.mode, "group");
401        assert_eq!(r.field, "field");
402    }
403
404    #[test]
405    fn parse_decompose_spec_comma_separated_rules_trims_whitespace() {
406        let rules = parse_decompose_spec("a:split:f, b:group:g , c:x:split:y");
407        assert_eq!(rules.len(), 3);
408        assert_eq!(rules[0].tag, "a");
409        assert_eq!(rules[1].tag, "b");
410        assert_eq!(rules[2].tag, "c");
411        assert_eq!(rules[2].path_segment, "x");
412    }
413
414    #[test]
415    fn parse_decompose_spec_rejects_empty_segments() {
416        // Too few segments
417        assert!(parse_decompose_spec("only:two").is_empty());
418        // Empty tag, mode, or field are filtered
419        assert!(parse_decompose_spec(":split:field").is_empty());
420        assert!(parse_decompose_spec("tag::field").is_empty());
421        assert!(parse_decompose_spec("tag:split:").is_empty());
422    }
423
424    #[test]
425    fn parse_multi_level_spec_valid_returns_rule() {
426        let rule = parse_multi_level_spec(
427            "programProcesses-meta:LoyaltyProgramSetup:parameterName,ruleName",
428        )
429        .unwrap();
430        assert_eq!(rule.file_pattern, "programProcesses-meta");
431        assert_eq!(rule.root_to_strip, "LoyaltyProgramSetup");
432        assert_eq!(rule.unique_id_elements, "parameterName,ruleName");
433        assert_eq!(rule.path_segment, "programProcesses");
434        assert_eq!(rule.wrap_root_element, "LoyaltyProgramSetup");
435        assert!(rule.wrap_xmlns.is_empty());
436    }
437
438    #[test]
439    fn parse_multi_level_spec_rejects_wrong_parts() {
440        assert!(parse_multi_level_spec("only:two").is_none());
441        assert!(parse_multi_level_spec(":Root:ids").is_none());
442        assert!(parse_multi_level_spec("file::ids").is_none());
443        assert!(parse_multi_level_spec("file:Root:").is_none());
444    }
445
446    #[test]
447    fn parse_multi_level_specs_single_rule_returns_one() {
448        let rules = parse_multi_level_specs("a-meta:Root:id");
449        assert_eq!(rules.len(), 1);
450        assert_eq!(rules[0].file_pattern, "a-meta");
451    }
452
453    #[test]
454    fn parse_multi_level_specs_semicolon_separates_rules() {
455        let rules =
456            parse_multi_level_specs("a-meta:RootA:id1,id2; b-meta:RootB:other ; c-meta:RootC:k");
457        assert_eq!(rules.len(), 3);
458        assert_eq!(rules[0].file_pattern, "a-meta");
459        assert_eq!(rules[0].unique_id_elements, "id1,id2");
460        assert_eq!(rules[1].file_pattern, "b-meta");
461        assert_eq!(rules[1].root_to_strip, "RootB");
462        assert_eq!(rules[2].file_pattern, "c-meta");
463    }
464
465    #[test]
466    fn parse_multi_level_specs_skips_empty_and_malformed() {
467        // Trailing semicolons and malformed rules are dropped without aborting the rest.
468        let rules = parse_multi_level_specs("a:R:id; ; bad ; b:R:id;");
469        assert_eq!(rules.len(), 2);
470        assert_eq!(rules[0].file_pattern, "a");
471        assert_eq!(rules[1].file_pattern, "b");
472    }
473
474    #[test]
475    fn parse_multi_level_specs_empty_string_returns_empty() {
476        assert!(parse_multi_level_specs("").is_empty());
477        assert!(parse_multi_level_specs(" ; ;").is_empty());
478    }
479
480    #[test]
481    fn parse_disassemble_args_handles_flags_and_eq_forms() {
482        let args = [
483            "path/to/file.xml",
484            "--postpurge",
485            "--prepurge",
486            "--unique-id-elements=name,id",
487            "--ignore-path=.foo",
488            "--format=json",
489            "--strategy=grouped-by-tag",
490            "--multi-level=pattern:Root:ids",
491            "--split-tags=a:split:b",
492        ]
493        .iter()
494        .map(|s| sv(s))
495        .collect::<Vec<_>>();
496        let opts = parse_disassemble_args(&args);
497        assert_eq!(opts.path, Some("path/to/file.xml"));
498        assert!(opts.pre_purge);
499        assert!(opts.post_purge);
500        assert_eq!(opts.unique_id_elements, Some("name,id"));
501        assert_eq!(opts.ignore_path, Some(".foo"));
502        assert_eq!(opts.format, "json");
503        assert_eq!(opts.strategy, Some("grouped-by-tag"));
504        assert_eq!(opts.multi_level.as_deref(), Some("pattern:Root:ids"));
505        assert_eq!(opts.split_tags.as_deref(), Some("a:split:b"));
506    }
507
508    #[test]
509    fn parse_disassemble_args_handles_space_separated_forms() {
510        let args = [
511            "file.xml",
512            "--unique-id-elements",
513            "name",
514            "--ignore-path",
515            ".gitignore",
516            "--format",
517            "yaml",
518            "--strategy",
519            "unique-id",
520            "--multi-level",
521            "p:R:ids",
522            "--split-tags",
523            "t:split:f",
524        ]
525        .iter()
526        .map(|s| sv(s))
527        .collect::<Vec<_>>();
528        let opts = parse_disassemble_args(&args);
529        assert_eq!(opts.path, Some("file.xml"));
530        assert_eq!(opts.unique_id_elements, Some("name"));
531        assert_eq!(opts.ignore_path, Some(".gitignore"));
532        assert_eq!(opts.format, "yaml");
533        assert_eq!(opts.strategy, Some("unique-id"));
534        assert_eq!(opts.multi_level.as_deref(), Some("p:R:ids"));
535        assert_eq!(opts.split_tags.as_deref(), Some("t:split:f"));
536    }
537
538    #[test]
539    fn parse_disassemble_args_space_form_value_is_not_misread_as_positional_path() {
540        // For every option that accepts a value in separated form, when the option
541        // is the leading argument and no positional path precedes it, the captured
542        // value must not be re-treated as the positional path. This pins down the
543        // `i += 1` advance after a value is consumed (regression: a missed advance
544        // would cause the parser to revisit the value on the next iteration and
545        // store it in `path`).
546        let cases: &[(&[&str], &str)] = &[
547            (&["--unique-id-elements", "name"], "name"),
548            (&["--ignore-path", ".foo"], ".foo"),
549            (&["--format", "yaml"], "yaml"),
550            (&["--strategy", "grouped-by-tag"], "grouped-by-tag"),
551            (&["--multi-level", "p:R:ids"], "p:R:ids"),
552            (&["--split-tags", "t:split:f"], "t:split:f"),
553            (&["-p", "t:split:f"], "t:split:f"),
554        ];
555        for (args, expected_value) in cases {
556            let owned: Vec<String> = args.iter().map(|s| sv(s)).collect();
557            let opts = parse_disassemble_args(&owned);
558            assert!(
559                opts.path.is_none(),
560                "args {args:?}: value `{expected_value}` was incorrectly captured as path"
561            );
562        }
563    }
564
565    #[test]
566    fn parse_disassemble_args_space_form_value_missing_does_not_panic() {
567        // When a value-consuming option is the last arg with no following value,
568        // the bounds check (`if i < args.len()`) must prevent an out-of-bounds
569        // read. Each of these inputs would panic if the bounds check is mutated
570        // from `<` to `<=`.
571        let options = [
572            "--unique-id-elements",
573            "--ignore-path",
574            "--format",
575            "--strategy",
576            "--multi-level",
577            "--split-tags",
578            "-p",
579        ];
580        for opt in options {
581            let args = [opt].iter().map(|s| sv(s)).collect::<Vec<_>>();
582            let opts = parse_disassemble_args(&args);
583            // The defaults assertion is incidental; the real assertion is that
584            // the call above does not panic.
585            assert!(opts.path.is_none(), "bare option `{opt}` set a path");
586        }
587    }
588
589    #[test]
590    fn parse_disassemble_args_p_alias_for_split_tags() {
591        let args = ["file.xml", "-p", "a:split:b"]
592            .iter()
593            .map(|s| sv(s))
594            .collect::<Vec<_>>();
595        let opts = parse_disassemble_args(&args);
596        assert_eq!(opts.split_tags.as_deref(), Some("a:split:b"));
597    }
598
599    #[test]
600    fn parse_disassemble_args_unknown_long_flag_is_skipped() {
601        let args = ["file.xml", "--unknown"]
602            .iter()
603            .map(|s| sv(s))
604            .collect::<Vec<_>>();
605        let opts = parse_disassemble_args(&args);
606        assert_eq!(opts.path, Some("file.xml"));
607    }
608
609    #[test]
610    fn parse_disassemble_args_defaults_when_empty() {
611        let opts = parse_disassemble_args(&[]);
612        assert!(opts.path.is_none());
613        assert!(opts.strategy.is_none());
614        assert!(opts.unique_id_elements.is_none());
615        assert!(!opts.pre_purge);
616        assert!(!opts.post_purge);
617        assert!(
618            opts.ignore_path.is_none(),
619            "default is `None` so the runner can pick the right filename"
620        );
621        assert_eq!(opts.format, "xml");
622    }
623
624    #[test]
625    fn parse_disassemble_args_space_forms_without_value_leave_default() {
626        let args = ["--unique-id-elements"]
627            .iter()
628            .map(|s| sv(s))
629            .collect::<Vec<_>>();
630        let opts = parse_disassemble_args(&args);
631        assert!(opts.unique_id_elements.is_none());
632    }
633
634    #[test]
635    fn parse_disassemble_args_trailing_extra_positional_ignored() {
636        let args = ["first.xml", "second.xml"]
637            .iter()
638            .map(|s| sv(s))
639            .collect::<Vec<_>>();
640        let opts = parse_disassemble_args(&args);
641        assert_eq!(opts.path, Some("first.xml"));
642    }
643
644    #[test]
645    fn parse_reassemble_args_picks_path_extension_and_flag() {
646        let args = ["some/dir", "json", "--postpurge"]
647            .iter()
648            .map(|s| sv(s))
649            .collect::<Vec<_>>();
650        let (path, ext, purge) = parse_reassemble_args(&args);
651        assert_eq!(path, Some("some/dir"));
652        assert_eq!(ext, Some("json"));
653        assert!(purge);
654    }
655
656    #[test]
657    fn parse_reassemble_args_defaults_and_extra_args_ignored() {
658        let (p, e, purge) = parse_reassemble_args(&[]);
659        assert!(p.is_none());
660        assert!(e.is_none());
661        assert!(!purge);
662
663        let args = ["dir", "xml", "extra"]
664            .iter()
665            .map(|s| sv(s))
666            .collect::<Vec<_>>();
667        let (p, e, _) = parse_reassemble_args(&args);
668        assert_eq!(p, Some("dir"));
669        assert_eq!(e, Some("xml"));
670    }
671
672    #[tokio::test]
673    async fn run_no_args_prints_usage_and_succeeds() {
674        run(vec![sv("xml-disassembler")]).await.unwrap();
675    }
676
677    #[tokio::test]
678    async fn run_unknown_command_is_not_an_error() {
679        run(vec![sv("xml-disassembler"), sv("unknown")])
680            .await
681            .unwrap();
682    }
683
684    #[tokio::test]
685    async fn run_reassemble_missing_path_returns_err() {
686        // Missing directory path propagates an error from fs::metadata.
687        let err = run(vec![
688            sv("xml-disassembler"),
689            sv("reassemble"),
690            sv("/definitely/not/here/xyz"),
691        ])
692        .await;
693        assert!(err.is_err());
694    }
695
696    #[tokio::test]
697    async fn run_disassemble_writes_expected_output() {
698        let dir = tempfile::tempdir().unwrap();
699        let xml_path = dir.path().join("sample.xml");
700        let xml = r#"<?xml version="1.0" encoding="UTF-8"?>
701<Root xmlns="http://example.com">
702  <child><name>one</name></child>
703  <child><name>two</name></child>
704</Root>"#;
705        std::fs::write(&xml_path, xml).unwrap();
706        run(vec![
707            sv("xml-disassembler"),
708            sv("disassemble"),
709            xml_path.to_string_lossy().to_string(),
710        ])
711        .await
712        .unwrap();
713        assert!(dir.path().join("sample").exists());
714    }
715
716    #[tokio::test]
717    async fn run_disassemble_with_invalid_multi_level_spec_warns_and_continues() {
718        let dir = tempfile::tempdir().unwrap();
719        let xml_path = dir.path().join("sample.xml");
720        let xml =
721            r#"<?xml version="1.0" encoding="UTF-8"?><Root><child><name>a</name></child></Root>"#;
722        std::fs::write(&xml_path, xml).unwrap();
723        run(vec![
724            sv("xml-disassembler"),
725            sv("disassemble"),
726            xml_path.to_string_lossy().to_string(),
727            sv("--multi-level=bad-spec"),
728        ])
729        .await
730        .unwrap();
731    }
732
733    #[tokio::test]
734    async fn run_reassemble_on_existing_directory_succeeds() {
735        // Disassemble then reassemble via the CLI to cover the success path end-to-end.
736        let dir = tempfile::tempdir().unwrap();
737        let xml_path = dir.path().join("reasm.xml");
738        let xml = r#"<?xml version="1.0" encoding="UTF-8"?>
739<Root><child><name>one</name></child><child><name>two</name></child></Root>"#;
740        std::fs::write(&xml_path, xml).unwrap();
741        run(vec![
742            sv("xml-disassembler"),
743            sv("disassemble"),
744            xml_path.to_string_lossy().to_string(),
745        ])
746        .await
747        .unwrap();
748        let disassembled_dir = dir.path().join("reasm");
749        assert!(disassembled_dir.exists());
750        run(vec![
751            sv("xml-disassembler"),
752            sv("reassemble"),
753            disassembled_dir.to_string_lossy().to_string(),
754        ])
755        .await
756        .unwrap();
757    }
758
759    #[tokio::test]
760    async fn run_disassemble_with_grouped_by_tag_no_split_tags_uses_empty_decompose_rules() {
761        // grouped-by-tag with no --split-tags: decompose_rules falls back to Vec::new()
762        // via `unwrap_or_default()` and decompose_rules_ref becomes None.
763        let dir = tempfile::tempdir().unwrap();
764        let xml_path = dir.path().join("sample.xml");
765        let xml =
766            r#"<?xml version="1.0" encoding="UTF-8"?><Root><a><n>1</n></a><b><n>2</n></b></Root>"#;
767        std::fs::write(&xml_path, xml).unwrap();
768        run(vec![
769            sv("xml-disassembler"),
770            sv("disassemble"),
771            xml_path.to_string_lossy().to_string(),
772            sv("--strategy=grouped-by-tag"),
773        ])
774        .await
775        .unwrap();
776    }
777
778    #[tokio::test]
779    async fn run_disassemble_with_grouped_by_tag_split_tags_runs() {
780        let dir = tempfile::tempdir().unwrap();
781        let xml_path = dir.path().join("perms.xml");
782        let xml = r#"<?xml version="1.0" encoding="UTF-8"?>
783<Root>
784  <objectPermissions><object>A</object><allowRead>true</allowRead></objectPermissions>
785  <objectPermissions><object>B</object><allowRead>false</allowRead></objectPermissions>
786</Root>"#;
787        std::fs::write(&xml_path, xml).unwrap();
788        run(vec![
789            sv("xml-disassembler"),
790            sv("disassemble"),
791            xml_path.to_string_lossy().to_string(),
792            sv("--strategy=grouped-by-tag"),
793            sv("-p"),
794            sv("objectPermissions:split:object"),
795        ])
796        .await
797        .unwrap();
798    }
799
800    #[test]
801    fn should_print_usage_only_for_fewer_than_two_args() {
802        // Pins each `<` mutant: `<=` would also trigger on len=2,
803        // `==` would miss len=0, `>` would invert the polarity.
804        assert!(should_print_usage(0));
805        assert!(should_print_usage(1));
806        assert!(!should_print_usage(2));
807        assert!(!should_print_usage(3));
808    }
809
810    #[test]
811    fn multi_level_spec_failed_to_parse_requires_both_conditions() {
812        // The warning must fire only when a spec was *provided* and
813        // parsing returned no rules — every other quadrant is silent.
814        assert!(multi_level_spec_failed_to_parse(true, true));
815        assert!(!multi_level_spec_failed_to_parse(true, false));
816        assert!(!multi_level_spec_failed_to_parse(false, true));
817        assert!(!multi_level_spec_failed_to_parse(false, false));
818    }
819
820    #[test]
821    fn should_parse_decompose_rules_only_for_grouped_by_tag() {
822        // Decompose rules are exclusive to `grouped-by-tag`. Mutating
823        // the original `==` to `!=` would forward decompose specs to
824        // the `unique-id` strategy and trigger downstream work that
825        // times out under cargo-mutants — testing the helper directly
826        // pins the operator without involving the async pipeline.
827        assert!(should_parse_decompose_rules("grouped-by-tag"));
828        assert!(!should_parse_decompose_rules("unique-id"));
829        assert!(!should_parse_decompose_rules(""));
830        assert!(!should_parse_decompose_rules("Grouped-By-Tag"));
831    }
832
833    #[tokio::test]
834    async fn run_disassemble_with_valid_multi_level_spec_passes_rules_slice() {
835        // A syntactically valid --multi-level spec causes multi_level_rules_ref to be
836        // Some(slice) (line 299 in run_disassemble), covering that branch.
837        let dir = tempfile::tempdir().unwrap();
838        let xml_path = dir.path().join("sample.xml");
839        let xml =
840            r#"<?xml version="1.0" encoding="UTF-8"?><Root><child><name>a</name></child></Root>"#;
841        std::fs::write(&xml_path, xml).unwrap();
842        run(vec![
843            sv("xml-disassembler"),
844            sv("disassemble"),
845            xml_path.to_string_lossy().to_string(),
846            sv("--multi-level=child:Root:name"),
847        ])
848        .await
849        .unwrap();
850    }
851
852    #[test]
853    fn parse_sidecar_specs_empty_element_is_dropped() {
854        // `:yaml` — element part is empty; must not produce a spec.
855        let specs = parse_sidecar_specs(":yaml");
856        assert!(specs.is_empty(), "expected no specs, got: {specs:?}");
857    }
858
859    #[test]
860    fn parse_sidecar_specs_empty_extension_is_dropped() {
861        // `schema:` — extension part is empty; must not produce a spec.
862        let specs = parse_sidecar_specs("schema:");
863        assert!(specs.is_empty(), "expected no specs, got: {specs:?}");
864    }
865}