Skip to main content

kaish_types/
output.rs

1//! Structured output model (Tree-of-Tables) and output format handling.
2//!
3//! The unified output model uses `OutputData` containing a tree of `OutputNode`s:
4//!
5//! - **Builtins**: Pure data producers returning `OutputData`
6//! - **Frontends**: Handle all rendering (REPL, MCP, kaijutsu)
7
8use serde::{Deserialize, Serialize};
9
10use crate::result::ExecResult;
11
12// ============================================================
13// Structured Output (Tree-of-Tables Model)
14// ============================================================
15
16/// Entry type for rendering hints (colors, icons).
17///
18/// This unified enum is used by both the new OutputNode system
19/// and the legacy DisplayHint::Table for backward compatibility.
20#[non_exhaustive]
21#[derive(Debug, Clone, Copy, PartialEq, Eq, Default, Serialize, Deserialize)]
22#[cfg_attr(feature = "schema", derive(schemars::JsonSchema))]
23#[serde(rename_all = "lowercase")]
24pub enum EntryType {
25    /// Generic text content.
26    #[default]
27    Text,
28    /// Regular file.
29    File,
30    /// Directory.
31    Directory,
32    /// Executable file.
33    Executable,
34    /// Symbolic link.
35    Symlink,
36}
37
38/// A node in the output tree.
39///
40/// All fields are always serialized (no skip_serializing_if) for predictable shape
41/// across JSON, postcard, and bincode formats.
42///
43/// `text` is Option<String> because None and Some("") are semantically distinct:
44/// - None: this is a named entry (file listing, table row), not a text node
45/// - Some(""): this IS a text node whose content is empty (e.g. `echo ""`)
46///
47/// The `is_text_only()` method depends on this distinction.
48#[derive(Debug, Clone, PartialEq, Eq, Default, Serialize, Deserialize)]
49#[cfg_attr(feature = "schema", derive(schemars::JsonSchema))]
50#[serde(default)]
51pub struct OutputNode {
52    /// Primary identifier (filename, key, label).
53    pub name: String,
54    /// Rendering hint (colors, icons).
55    pub entry_type: EntryType,
56    /// Text content (for echo, cat, exec).
57    ///
58    /// Three-state semantics:
59    /// - `None` — named entry (file listing, table row), not text
60    /// - `Some("")` — text node with empty content (e.g., `echo ""`)
61    /// - `Some("x")` — text node with content
62    ///
63    /// `is_text_only()` returns true iff text is Some AND name/cells/children are empty.
64    pub text: Option<String>,
65    /// Additional columns (for ls -l, ps, env).
66    pub cells: Vec<String>,
67    /// Child nodes (for tree, find).
68    pub children: Vec<OutputNode>,
69}
70
71impl OutputNode {
72    /// Create a new node with a name.
73    pub fn new(name: impl Into<String>) -> Self {
74        Self {
75            name: name.into(),
76            ..Default::default()
77        }
78    }
79
80    /// Create a text-only node (for echo, cat, etc.).
81    pub fn text(content: impl Into<String>) -> Self {
82        Self {
83            text: Some(content.into()),
84            ..Default::default()
85        }
86    }
87
88    /// Set the entry type for rendering hints.
89    pub fn with_entry_type(mut self, entry_type: EntryType) -> Self {
90        self.entry_type = entry_type;
91        self
92    }
93
94    /// Set additional columns for tabular output.
95    pub fn with_cells(mut self, cells: Vec<String>) -> Self {
96        self.cells = cells;
97        self
98    }
99
100    /// Set child nodes for tree output.
101    pub fn with_children(mut self, children: Vec<OutputNode>) -> Self {
102        self.children = children;
103        self
104    }
105
106    /// Set text content.
107    pub fn with_text(mut self, text: impl Into<String>) -> Self {
108        self.text = Some(text.into());
109        self
110    }
111
112    /// Check if this is a text-only node.
113    pub fn is_text_only(&self) -> bool {
114        self.text.is_some() && self.name.is_empty() && self.cells.is_empty() && self.children.is_empty()
115    }
116
117    /// Check if this node has children.
118    pub fn has_children(&self) -> bool {
119        !self.children.is_empty()
120    }
121
122    /// Estimate brace-notation byte size without materializing.
123    pub fn estimated_byte_size(&self) -> usize {
124        if self.children.is_empty() {
125            self.name.len() + self.text.as_ref().map_or(0, |t| t.len())
126        } else {
127            // "name/{child1,child2,...}"
128            let mut size = self.name.len() + 2; // name + "/{" + "}"
129            for (i, child) in self.children.iter().enumerate() {
130                if i > 0 {
131                    size += 1; // comma separator
132                }
133                size += child.estimated_byte_size();
134            }
135            size + 1 // closing brace
136        }
137    }
138
139    /// Write brace-notation to a writer. Returns bytes written.
140    pub fn write_canonical(&self, w: &mut dyn std::io::Write, budget: usize) -> std::io::Result<usize> {
141        if self.children.is_empty() {
142            w.write_all(self.name.as_bytes())?;
143            return Ok(self.name.len());
144        }
145        let mut written = 0;
146        w.write_all(self.name.as_bytes())?;
147        written += self.name.len();
148        if written >= budget {
149            return Ok(written);
150        }
151        w.write_all(b"/{")?;
152        written += 2;
153        for (i, child) in self.children.iter().enumerate() {
154            if written >= budget {
155                break;
156            }
157            if i > 0 {
158                w.write_all(b",")?;
159                written += 1;
160            }
161            written += child.write_canonical(w, budget.saturating_sub(written))?;
162        }
163        w.write_all(b"}")?;
164        written += 1;
165        Ok(written)
166    }
167
168    /// Get the display name, potentially with text content.
169    pub fn display_name(&self) -> &str {
170        if self.name.is_empty() {
171            self.text.as_deref().unwrap_or("")
172        } else {
173            &self.name
174        }
175    }
176}
177
178/// Structured output data from a command.
179///
180/// This is the top-level structure for command output.
181/// It contains optional column headers and a list of root nodes.
182///
183/// `headers` is Option<Vec<String>> because None means "not tabular" while
184/// Some(vec![]) means "tabular with no column headers." The rendering dispatch
185/// in to_json() and the REPL formatter branch on this distinction.
186///
187/// # Rendering Rules
188///
189/// | Structure | Interactive | Piped/Model |
190/// |-----------|-------------|-------------|
191/// | Single node with `text` | Print text | Print text |
192/// | Flat nodes, `name` only | Multi-column, colored | One per line |
193/// | Flat nodes with `cells` | Aligned table | TSV or names only |
194/// | Nested `children` | Box-drawing tree | Brace notation |
195#[derive(Debug, Clone, PartialEq, Eq, Default, Serialize, Deserialize)]
196#[cfg_attr(feature = "schema", derive(schemars::JsonSchema))]
197#[serde(default)]
198#[non_exhaustive]
199pub struct OutputData {
200    /// Column headers (optional, for table output).
201    pub headers: Option<Vec<String>>,
202    /// Top-level nodes.
203    pub root: Vec<OutputNode>,
204    /// Render-only override for `--json` consumers. When `Some`,
205    /// `to_json()` returns this verbatim instead of inferring from
206    /// `headers` / `root` / `cells`. Use it when a builtin wants its
207    /// `--json` shape to be richer than the table form (e.g. grep
208    /// emitting per-match objects with submatches and byte offsets).
209    ///
210    /// Skipped by serde (and thus by postcard / bincode) — this is a
211    /// transient render hint, not part of the persisted shape.
212    #[serde(skip)]
213    #[cfg_attr(feature = "schema", schemars(skip))]
214    pub rich_json: Option<serde_json::Value>,
215}
216
217impl OutputData {
218    /// Create new empty output data.
219    pub fn new() -> Self {
220        Self::default()
221    }
222
223    /// Create output data with a single text node.
224    ///
225    /// This is the simplest form for commands like `echo`.
226    pub fn text(content: impl Into<String>) -> Self {
227        Self {
228            headers: None,
229            root: vec![OutputNode::text(content)],
230            rich_json: None,
231        }
232    }
233
234    /// Create output data with named nodes (for ls, etc.).
235    pub fn nodes(nodes: Vec<OutputNode>) -> Self {
236        Self {
237            headers: None,
238            root: nodes,
239            rich_json: None,
240        }
241    }
242
243    /// Create output data with headers and nodes (for ls -l, ps, etc.).
244    pub fn table(headers: Vec<String>, nodes: Vec<OutputNode>) -> Self {
245        Self {
246            headers: Some(headers),
247            root: nodes,
248            rich_json: None,
249        }
250    }
251
252    /// Set column headers.
253    pub fn with_headers(mut self, headers: Vec<String>) -> Self {
254        self.headers = Some(headers);
255        self
256    }
257
258    /// Attach a render-only `--json` override. See `rich_json` field doc.
259    pub fn with_rich_json(mut self, value: serde_json::Value) -> Self {
260        self.rich_json = Some(value);
261        self
262    }
263
264    /// Check if this output is simple text (single text-only node).
265    pub fn is_simple_text(&self) -> bool {
266        self.root.len() == 1 && self.root[0].is_text_only()
267    }
268
269    /// Check if this output is a flat list (no nested children).
270    pub fn is_flat(&self) -> bool {
271        self.root.iter().all(|n| !n.has_children())
272    }
273
274    /// Check if this output has tabular data (nodes with cells).
275    pub fn is_tabular(&self) -> bool {
276        self.root.iter().any(|n| !n.cells.is_empty())
277    }
278
279    /// Get the text content if this is simple text output.
280    pub fn as_text(&self) -> Option<&str> {
281        if self.is_simple_text() {
282            self.root[0].text.as_deref()
283        } else {
284            None
285        }
286    }
287
288    /// Extract the owned String from a single-text-node OutputData.
289    /// Returns `Err(self)` for non-simple-text output (tables, trees, multi-node),
290    /// giving the caller back the unconsumed OutputData.
291    pub fn into_text(mut self) -> Result<String, Self> {
292        if self.root.len() == 1 && self.root[0].is_text_only() {
293            Ok(self.root.pop().and_then(|n| n.text).unwrap_or_default())
294        } else {
295            Err(self)
296        }
297    }
298
299    /// Estimate canonical string byte size without materializing.
300    ///
301    /// Lower bound — actual may be slightly larger due to formatting.
302    /// Mirrors `to_canonical_string()` structure but only accumulates sizes.
303    pub fn estimated_byte_size(&self) -> usize {
304        if self.root.len() == 1 && self.root[0].is_text_only() {
305            return self.root[0].text.as_ref().map_or(0, |t| t.len());
306        }
307
308        if self.is_flat() {
309            let mut size = 0;
310            for (i, n) in self.root.iter().enumerate() {
311                if i > 0 {
312                    size += 1; // newline separator
313                }
314                size += n.display_name().len();
315                for cell in &n.cells {
316                    size += 1 + cell.len(); // tab + cell
317                }
318            }
319            return size;
320        }
321
322        // Tree: estimate brace notation
323        let mut size = 0;
324        for (i, n) in self.root.iter().enumerate() {
325            if i > 0 {
326                size += 1; // newline separator
327            }
328            size += n.estimated_byte_size();
329        }
330        size
331    }
332
333    /// Write canonical representation to a writer with optional byte budget.
334    ///
335    /// Returns total bytes written. Stops after budget exceeded (imprecise:
336    /// one write past the limit is fine — caller uses this for spill detection,
337    /// not for exact truncation).
338    pub fn write_canonical(&self, w: &mut dyn std::io::Write, budget: Option<usize>) -> std::io::Result<usize> {
339        let mut written = 0usize;
340        let budget = budget.unwrap_or(usize::MAX);
341
342        if self.root.len() == 1 && self.root[0].is_text_only() {
343            if let Some(ref text) = self.root[0].text {
344                w.write_all(text.as_bytes())?;
345                return Ok(text.len());
346            }
347            return Ok(0);
348        }
349
350        if self.is_flat() {
351            for (i, n) in self.root.iter().enumerate() {
352                if i > 0 {
353                    w.write_all(b"\n")?;
354                    written += 1;
355                }
356                let name = n.display_name();
357                w.write_all(name.as_bytes())?;
358                written += name.len();
359                for cell in &n.cells {
360                    w.write_all(b"\t")?;
361                    w.write_all(cell.as_bytes())?;
362                    written += 1 + cell.len();
363                }
364                if written > budget {
365                    return Ok(written);
366                }
367            }
368            return Ok(written);
369        }
370
371        // Tree: brace notation
372        for (i, n) in self.root.iter().enumerate() {
373            if i > 0 {
374                w.write_all(b"\n")?;
375                written += 1;
376            }
377            written += n.write_canonical(w, budget.saturating_sub(written))?;
378            if written > budget {
379                return Ok(written);
380            }
381        }
382        Ok(written)
383    }
384
385    /// Convert to canonical string output (for pipes).
386    ///
387    /// This produces a simple string representation suitable for
388    /// piping to other commands:
389    /// - Text nodes: their text content
390    /// - Named nodes: names joined by newlines
391    /// - Tabular nodes (name + cells): TSV format (name\tcell1\tcell2...)
392    /// - Nested nodes: brace notation
393    pub fn to_canonical_string(&self) -> String {
394        if let Some(text) = self.as_text() {
395            return text.to_string();
396        }
397
398        // For flat lists (with or without cells), output one line per node
399        if self.is_flat() {
400            return self.root.iter()
401                .map(|n| {
402                    if n.cells.is_empty() {
403                        n.display_name().to_string()
404                    } else {
405                        // For tabular data, use TSV format
406                        let mut parts = vec![n.display_name().to_string()];
407                        parts.extend(n.cells.iter().cloned());
408                        parts.join("\t")
409                    }
410                })
411                .collect::<Vec<_>>()
412                .join("\n");
413        }
414
415        // For trees, use brace notation
416        fn format_node(node: &OutputNode) -> String {
417            if node.children.is_empty() {
418                node.name.clone()
419            } else {
420                let children: Vec<String> = node.children.iter()
421                    .map(format_node)
422                    .collect();
423                format!("{}/{{{}}}", node.name, children.join(","))
424            }
425        }
426
427        self.root.iter()
428            .map(format_node)
429            .collect::<Vec<_>>()
430            .join("\n")
431    }
432
433    /// Serialize to a JSON value for `--json` flag handling.
434    ///
435    /// Bare data, no envelope — optimized for `jq` patterns.
436    ///
437    /// | Structure | JSON |
438    /// |-----------|------|
439    /// | Simple text | `"hello world"` |
440    /// | Flat list (names only) | `["file1", "file2"]` |
441    /// | Table (headers + cells) | `[{"col1": "v1", ...}, ...]` |
442    /// | Tree (nested children) | `{"dir": {"file": null}}` |
443    pub fn to_json(&self) -> serde_json::Value {
444        // Builtin-supplied override wins (used by `grep --json` to expose
445        // submatches/byte offsets that don't fit the table model).
446        if let Some(rich) = &self.rich_json {
447            return rich.clone();
448        }
449        // Simple text -> JSON string
450        if let Some(text) = self.as_text() {
451            return serde_json::Value::String(text.to_string());
452        }
453
454        // Table -> array of objects keyed by headers. Nodes with children
455        // (e.g. `ls -lR`, where root nodes are directory groups holding the
456        // actual entries) nest those entries under a "children" key — dropping
457        // them would silently lose every file and size.
458        if let Some(ref headers) = self.headers {
459            fn row_to_json(node: &OutputNode, headers: &[String]) -> serde_json::Value {
460                let mut map = serde_json::Map::new();
461                // First header maps to node.name
462                if let Some(first) = headers.first() {
463                    map.insert(first.clone(), serde_json::Value::String(node.name.clone()));
464                }
465                // Remaining headers map to cells
466                for (header, cell) in headers.iter().skip(1).zip(node.cells.iter()) {
467                    map.insert(header.clone(), serde_json::Value::String(cell.clone()));
468                }
469                if !node.children.is_empty() {
470                    let children: Vec<serde_json::Value> = node
471                        .children
472                        .iter()
473                        .map(|child| row_to_json(child, headers))
474                        .collect();
475                    map.insert("children".to_string(), serde_json::Value::Array(children));
476                }
477                serde_json::Value::Object(map)
478            }
479            let rows: Vec<serde_json::Value> = self
480                .root
481                .iter()
482                .map(|node| row_to_json(node, headers))
483                .collect();
484            return serde_json::Value::Array(rows);
485        }
486
487        // Tree -> nested object
488        if !self.is_flat() {
489            fn node_to_json(node: &OutputNode) -> serde_json::Value {
490                if node.children.is_empty() {
491                    serde_json::Value::Null
492                } else {
493                    let mut map = serde_json::Map::new();
494                    for child in &node.children {
495                        map.insert(child.name.clone(), node_to_json(child));
496                    }
497                    serde_json::Value::Object(map)
498                }
499            }
500
501            // Single root node -> its children as the top-level object
502            if self.root.len() == 1 {
503                return node_to_json(&self.root[0]);
504            }
505            // Multiple root nodes -> object with each root as a key
506            let mut map = serde_json::Map::new();
507            for node in &self.root {
508                map.insert(node.name.clone(), node_to_json(node));
509            }
510            return serde_json::Value::Object(map);
511        }
512
513        // Flat list -> array of strings
514        let items: Vec<serde_json::Value> = self.root.iter()
515            .map(|n| serde_json::Value::String(n.display_name().to_string()))
516            .collect();
517        serde_json::Value::Array(items)
518    }
519}
520
521// ============================================================
522// Output Format (Global --json flag)
523// ============================================================
524
525/// Output serialization format, requested via global flags.
526#[non_exhaustive]
527#[derive(Debug, Clone, Copy, PartialEq, Eq)]
528pub enum OutputFormat {
529    /// JSON serialization via OutputData::to_json()
530    Json,
531}
532
533/// Transform an ExecResult into the requested output format.
534///
535/// Serializes regardless of exit code — commands like `diff` (exit 1 = files differ)
536/// and `grep` (exit 1 = no matches) use non-zero exits for semantic meaning,
537/// not errors. The `--json` contract must hold for all exit codes.
538pub fn apply_output_format(mut result: ExecResult, format: OutputFormat) -> ExecResult {
539    // Binary results serialize as the self-describing base64 envelope, never a
540    // lossy-decoded JSON string. See docs/binary-data.md.
541    if result.is_bytes() {
542        let envelope = crate::bytes::bytes_to_envelope(result.out_bytes().unwrap_or(&[]));
543        match format {
544            OutputFormat::Json => {
545                result.set_out(
546                    serde_json::to_string(&envelope).unwrap_or_else(|_| "null".to_string()),
547                );
548                result.data = Some(crate::result::json_to_value(envelope));
549                result.set_output(None);
550            }
551        }
552        return result;
553    }
554    if !result.has_output() && result.text_out().is_empty() {
555        // No stdout to format. A failure that carries a diagnostic message must
556        // still honor --json — otherwise the message leaks out as plain text
557        // even though structured output was requested. Emit a JSON error object
558        // so the contract holds on the error path. A clean non-zero exit with no
559        // message (e.g. `grep` no-match, exit 1) is not an error and stays empty.
560        if !result.ok() && !result.err.is_empty() {
561            match format {
562                OutputFormat::Json => {
563                    let obj = serde_json::json!({
564                        "error": result.err,
565                        "code": result.code,
566                    });
567                    result.data = Some(crate::result::json_to_value(obj.clone()));
568                    result.set_out(
569                        serde_json::to_string(&obj).unwrap_or_else(|_| "null".to_string()),
570                    );
571                }
572            }
573        }
574        return result;
575    }
576    match format {
577        OutputFormat::Json => {
578            if let Some(output) = result.output() {
579                let json_value = output.to_json();
580                // NLL: borrow of result via output ends here (json_value is owned)
581                result.set_out(serde_json::to_string(&json_value)
582                    .unwrap_or_else(|_| "null".to_string()));
583                result.data = Some(crate::result::json_to_value(json_value));
584            } else if let Some(data) = &result.data {
585                // Structured data already present (e.g. jq, any `success_with_data`
586                // builtin): serialize that, not the rendered text. Re-wrapping the
587                // text as a JSON string would double-encode it (`"1"` not `1`) and
588                // clobber the real value. `.data` is the structured truth.
589                let json_out = serde_json::to_string(&crate::result::value_to_json(data))
590                    .unwrap_or_else(|_| "null".to_string());
591                result.set_out(json_out);
592            } else {
593                // Text-only: wrap as JSON string. .data mirrors the same string.
594                let text = result.text_out().into_owned();
595                let json_out = serde_json::to_string(&text)
596                    .unwrap_or_else(|_| "null".to_string());
597                result.data = Some(crate::value::Value::String(text));
598                result.set_out(json_out);
599            }
600            // Clear sentinel — format already applied, prevents double-encoding
601            result.set_output(None);
602            result
603        }
604    }
605}
606
607#[cfg(test)]
608mod tests {
609    use super::*;
610
611    #[test]
612    fn entry_type_variants() {
613        assert_ne!(EntryType::File, EntryType::Directory);
614        assert_ne!(EntryType::Directory, EntryType::Executable);
615        assert_ne!(EntryType::Executable, EntryType::Symlink);
616    }
617
618    #[test]
619    fn to_json_simple_text() {
620        let output = OutputData::text("hello world");
621        assert_eq!(output.to_json(), serde_json::json!("hello world"));
622    }
623
624    #[test]
625    fn to_json_flat_list() {
626        let output = OutputData::nodes(vec![
627            OutputNode::new("file1"),
628            OutputNode::new("file2"),
629            OutputNode::new("file3"),
630        ]);
631        assert_eq!(output.to_json(), serde_json::json!(["file1", "file2", "file3"]));
632    }
633
634    #[test]
635    fn to_json_table() {
636        let output = OutputData::table(
637            vec!["NAME".into(), "SIZE".into(), "TYPE".into()],
638            vec![
639                OutputNode::new("foo.rs").with_cells(vec!["1024".into(), "file".into()]),
640                OutputNode::new("bar/").with_cells(vec!["4096".into(), "dir".into()]),
641            ],
642        );
643        assert_eq!(output.to_json(), serde_json::json!([
644            {"NAME": "foo.rs", "SIZE": "1024", "TYPE": "file"},
645            {"NAME": "bar/", "SIZE": "4096", "TYPE": "dir"},
646        ]));
647    }
648
649    #[test]
650    fn to_json_table_with_children() {
651        // `ls -lR --json` builds a table whose root nodes are directory
652        // groups and whose actual entries (with size/type cells) live in
653        // `children`. The table serializer must recurse into them or every
654        // file and size is silently dropped — corruption, not an error.
655        let output = OutputData::table(
656            vec!["NAME".into(), "TYPE".into(), "SIZE".into()],
657            vec![
658                OutputNode::new(".")
659                    .with_entry_type(EntryType::Directory)
660                    .with_children(vec![
661                        OutputNode::new("top.txt").with_cells(vec!["-".into(), "6".into()]),
662                        OutputNode::new("a").with_cells(vec!["d".into(), "60".into()]),
663                    ]),
664                OutputNode::new("a")
665                    .with_entry_type(EntryType::Directory)
666                    .with_children(vec![
667                        OutputNode::new("mid.txt").with_cells(vec!["-".into(), "3".into()]),
668                    ]),
669            ],
670        );
671        assert_eq!(output.to_json(), serde_json::json!([
672            {"NAME": ".", "children": [
673                {"NAME": "top.txt", "TYPE": "-", "SIZE": "6"},
674                {"NAME": "a", "TYPE": "d", "SIZE": "60"},
675            ]},
676            {"NAME": "a", "children": [
677                {"NAME": "mid.txt", "TYPE": "-", "SIZE": "3"},
678            ]},
679        ]));
680    }
681
682    #[test]
683    fn to_json_tree() {
684        let child1 = OutputNode::new("main.rs").with_entry_type(EntryType::File);
685        let child2 = OutputNode::new("utils.rs").with_entry_type(EntryType::File);
686        let subdir = OutputNode::new("lib")
687            .with_entry_type(EntryType::Directory)
688            .with_children(vec![child2]);
689        let root = OutputNode::new("src")
690            .with_entry_type(EntryType::Directory)
691            .with_children(vec![child1, subdir]);
692
693        let output = OutputData::nodes(vec![root]);
694        assert_eq!(output.to_json(), serde_json::json!({
695            "main.rs": null,
696            "lib": {"utils.rs": null},
697        }));
698    }
699
700    #[test]
701    fn to_json_tree_multiple_roots() {
702        let root1 = OutputNode::new("src")
703            .with_entry_type(EntryType::Directory)
704            .with_children(vec![OutputNode::new("main.rs")]);
705        let root2 = OutputNode::new("docs")
706            .with_entry_type(EntryType::Directory)
707            .with_children(vec![OutputNode::new("README.md")]);
708
709        let output = OutputData::nodes(vec![root1, root2]);
710        assert_eq!(output.to_json(), serde_json::json!({
711            "src": {"main.rs": null},
712            "docs": {"README.md": null},
713        }));
714    }
715
716    #[test]
717    fn to_json_empty() {
718        let output = OutputData::new();
719        assert_eq!(output.to_json(), serde_json::json!([]));
720    }
721
722    #[test]
723    fn apply_output_format_clears_sentinel() {
724        let output = OutputData::table(
725            vec!["NAME".into()],
726            vec![OutputNode::new("test")],
727        );
728        let result = ExecResult::with_output(output);
729        assert!(result.has_output(), "before: sentinel present");
730
731        let formatted = apply_output_format(result, OutputFormat::Json);
732        assert!(!formatted.has_output(), "after Json: sentinel cleared");
733    }
734
735    #[test]
736    fn apply_output_format_no_double_encoding() {
737        let output = OutputData::nodes(vec![
738            OutputNode::new("file1"),
739            OutputNode::new("file2"),
740        ]);
741        let result = ExecResult::with_output(output);
742
743        let after_json = apply_output_format(result, OutputFormat::Json);
744        let json_out = after_json.text_out().into_owned();
745        assert!(!after_json.has_output(), "sentinel cleared by Json");
746
747        let parsed: serde_json::Value = serde_json::from_str(&json_out).expect("valid JSON");
748        assert_eq!(parsed, serde_json::json!(["file1", "file2"]));
749    }
750
751    #[test]
752    fn apply_output_format_populates_data() {
753        let output = OutputData::nodes(vec![
754            OutputNode::new("file1"),
755            OutputNode::new("file2"),
756        ]);
757        let result = ExecResult::with_output(output);
758        assert!(result.data.is_none(), "before: no data on non-text output");
759
760        let formatted = apply_output_format(result, OutputFormat::Json);
761        assert!(formatted.data.is_some(), "after Json: data populated");
762
763        // data should match the JSON in out
764        let data = formatted.data.unwrap();
765        assert!(matches!(data, crate::value::Value::Json(_)), "data should be Json variant");
766        if let crate::value::Value::Json(json) = data {
767            assert_eq!(json, serde_json::json!(["file1", "file2"]));
768        }
769    }
770
771    #[test]
772    fn apply_output_format_prefers_structured_data_over_text() {
773        // A `success_with_data` result (e.g. jq '.a' on {"a":1}) carries the
774        // structured scalar in `.data` and the rendered text in stdout. --json
775        // must serialize the structured value (1), not re-wrap the text ("1").
776        use crate::value::Value;
777        let result = ExecResult::success_with_data("1", Value::Int(1));
778        assert!(!result.has_output(), "no OutputData sentinel on this path");
779
780        let formatted = apply_output_format(result, OutputFormat::Json);
781        let json_out = formatted.text_out().into_owned();
782        let parsed: serde_json::Value = serde_json::from_str(&json_out).expect("valid JSON");
783        assert_eq!(parsed, serde_json::json!(1), "number, not the string \"1\"");
784        // The structured `.data` is preserved, not clobbered down to a string.
785        assert_eq!(formatted.data, Some(Value::Int(1)));
786    }
787
788    #[test]
789    fn apply_output_format_compact_json() {
790        let output = OutputData::nodes(vec![
791            OutputNode::new("file1"),
792            OutputNode::new("file2"),
793        ]);
794        let result = ExecResult::with_output(output);
795
796        let formatted = apply_output_format(result, OutputFormat::Json);
797        // Compact JSON: no pretty-printing (no newlines within the array)
798        let out = formatted.text_out();
799        assert!(!out.contains('\n'), "should be compact JSON, got: {}", out);
800        assert_eq!(&*out, r#"["file1","file2"]"#);
801    }
802
803    #[test]
804    fn apply_output_format_emits_json_error_object_on_failure() {
805        // A failure with empty stdout and a populated err must still honor
806        // --json: emit {"error", "code"} rather than leaking the message as
807        // plain text (e.g. `grep --json --bogus-flag`).
808        let result = ExecResult::failure(2, "grep: unknown flag --bogus-flag");
809        assert!(!result.has_output());
810        assert!(result.text_out().is_empty());
811
812        let formatted = apply_output_format(result, OutputFormat::Json);
813        let out = formatted.text_out().into_owned();
814        let parsed: serde_json::Value = serde_json::from_str(&out).expect("valid JSON");
815        assert_eq!(
816            parsed,
817            serde_json::json!({"error": "grep: unknown flag --bogus-flag", "code": 2})
818        );
819        // .data mirrors the JSON object.
820        assert!(matches!(formatted.data, Some(crate::value::Value::Json(_))));
821    }
822
823    #[test]
824    fn apply_output_format_leaves_clean_no_match_empty() {
825        // grep no-match: exit 1, empty stdout, empty err. Not an error — must
826        // NOT be wrapped in a JSON error object; stays empty.
827        let result = ExecResult::failure(1, "");
828        let formatted = apply_output_format(result, OutputFormat::Json);
829        assert!(formatted.text_out().is_empty());
830        assert!(formatted.data.is_none());
831    }
832
833    #[test]
834    fn apply_output_format_empty_success_stays_empty() {
835        let result = ExecResult::success("");
836        let formatted = apply_output_format(result, OutputFormat::Json);
837        assert!(formatted.text_out().is_empty());
838        assert!(formatted.data.is_none());
839    }
840
841    #[test]
842    fn estimated_byte_size_text_only_node() {
843        let node = OutputNode::text("hello world");
844        // Text-only node: name is empty, text is "hello world" (11 bytes)
845        assert_eq!(node.estimated_byte_size(), 11);
846    }
847
848    #[test]
849    fn estimated_byte_size_named_node() {
850        let node = OutputNode::new("file.txt");
851        assert_eq!(node.estimated_byte_size(), 8);
852    }
853
854    #[test]
855    fn write_canonical_respects_budget() {
856        let parent = OutputNode::new("root")
857            .with_children(vec![
858                OutputNode::new("aaaa"),
859                OutputNode::new("bbbb"),
860                OutputNode::new("cccc"),
861            ]);
862        // With a very small budget, should stop writing children early
863        let mut buf = Vec::new();
864        let written = parent.write_canonical(&mut buf, 8).unwrap();
865        let output = String::from_utf8(buf).unwrap();
866        // "root" (4) + "/{" (2) = 6, then budget check kicks in after first child
867        assert!(written <= 16, "should respect budget, wrote {} bytes: {}", written, output);
868        // Should at least write the root name
869        assert!(output.starts_with("root"), "should start with root: {}", output);
870    }
871
872    #[test]
873    fn into_text_simple() {
874        let data = OutputData::text("hello");
875        assert_eq!(data.into_text(), Ok("hello".to_string()));
876    }
877
878    #[test]
879    fn into_text_non_simple() {
880        let data = OutputData::nodes(vec![OutputNode::new("a"), OutputNode::new("b")]);
881        assert!(data.into_text().is_err());
882    }
883
884    #[test]
885    fn into_text_empty() {
886        let data = OutputData::text("");
887        assert_eq!(data.into_text(), Ok("".to_string()));
888    }
889}