harn_vm/orchestration/
nested_invocation.rs

1//! Capability-ceiling guard for nested Harn invocations.
2//!
3//! When a script that already runs under a parent execution policy
4//! launches another Harn invocation — `harn run`, `harn workflow run`,
5//! `harn supervisor fire/replay`, or a Burin harness — Harn must scan
6//! the target and reject anything that asks for *more* than the parent
7//! ceiling. This module hosts the scanner: it accepts a parent
8//! [`CapabilityPolicy`] plus a description of the nested target, and
9//! returns the list of dimensions where the target widens the parent.
10//!
11//! The scanner is deliberately conservative: when in doubt about what
12//! the target requests, it errs on the side of "ask for more" so the
13//! parent rejects rather than silently widens. It is the integration
14//! layer's job to wire this into the actual launch points (the `exec`,
15//! `shell`, `host_call` builtins, the workflow CLI, the supervisor
16//! API).
17
18use std::collections::BTreeSet;
19
20use serde::{Deserialize, Serialize};
21
22use super::workflow_bundle::WorkflowBundle;
23use super::workflow_patch::{bundle_capability_ceiling, CapabilityCeilingViolation};
24use super::CapabilityPolicy;
25
26/// One Harn invocation that could be launched from inside another.
27/// Each variant carries the data the scanner needs to project an
28/// effective requested ceiling.
29#[derive(Clone, Debug)]
30pub enum NestedInvocationTarget<'a> {
31    /// A `harn workflow run`-style invocation against a parsed bundle.
32    WorkflowBundle(&'a WorkflowBundle),
33    /// A `harn run`-style invocation against a Harn script source. The
34    /// scanner does a coarse string scan for builtins that require
35    /// elevated capabilities; that is enough to catch the obvious
36    /// widening attempts without forcing the AST into this layer.
37    HarnScript { path: &'a str, source: &'a str },
38    /// A Burin harness manifest. The scanner reads
39    /// `capability_ceiling` and `tools` if present, falling back to
40    /// "request everything" so the parent rejects unstructured
41    /// manifests rather than rubber-stamping them.
42    BurinHarness { manifest: &'a serde_json::Value },
43}
44
45#[derive(Clone, Debug, Default, Serialize, Deserialize, PartialEq, Eq)]
46pub struct NestedInvocationCeilingReport {
47    pub target_kind: String,
48    pub target_label: String,
49    pub parent: CapabilityPolicy,
50    pub requested: CapabilityPolicy,
51    pub violations: Vec<CapabilityCeilingViolation>,
52}
53
54impl NestedInvocationCeilingReport {
55    pub fn allowed(&self) -> bool {
56        self.violations.is_empty()
57    }
58}
59
60/// Compute the capability ceiling that running `target` would request
61/// of its parent runtime. This mirrors the projection used inside
62/// [`bundle_capability_ceiling`] so workflow bundles and standalone
63/// scripts share one comparison axis.
64pub fn requested_ceiling_for_target(target: &NestedInvocationTarget<'_>) -> CapabilityPolicy {
65    match target {
66        NestedInvocationTarget::WorkflowBundle(bundle) => bundle_capability_ceiling(bundle),
67        NestedInvocationTarget::HarnScript { source, .. } => scan_harn_script_ceiling(source),
68        NestedInvocationTarget::BurinHarness { manifest } => scan_burin_manifest_ceiling(manifest),
69    }
70}
71
72/// Enforce the parent ceiling against a nested invocation target.
73/// Returns a populated report; callers reject the launch if
74/// `report.allowed()` is false.
75pub fn enforce_nested_invocation_ceiling(
76    parent: &CapabilityPolicy,
77    target: &NestedInvocationTarget<'_>,
78) -> NestedInvocationCeilingReport {
79    let requested = requested_ceiling_for_target(target);
80    let violations = collect_violations(parent, &requested);
81    let (kind, label) = match target {
82        NestedInvocationTarget::WorkflowBundle(bundle) => {
83            ("workflow_bundle".to_string(), bundle.id.clone())
84        }
85        NestedInvocationTarget::HarnScript { path, .. } => {
86            ("harn_script".to_string(), path.to_string())
87        }
88        NestedInvocationTarget::BurinHarness { manifest } => {
89            let label = manifest
90                .get("id")
91                .and_then(|value| value.as_str())
92                .unwrap_or("<unknown>")
93                .to_string();
94            ("burin_harness".to_string(), label)
95        }
96    };
97    NestedInvocationCeilingReport {
98        target_kind: kind,
99        target_label: label,
100        parent: parent.clone(),
101        requested,
102        violations,
103    }
104}
105
106fn collect_violations(
107    parent: &CapabilityPolicy,
108    requested: &CapabilityPolicy,
109) -> Vec<CapabilityCeilingViolation> {
110    let mut violations = Vec::new();
111    if !parent.tools.is_empty() {
112        for tool in &requested.tools {
113            if !parent.tools.contains(tool) {
114                violations.push(CapabilityCeilingViolation {
115                    kind: "tool".to_string(),
116                    detail: format!("nested target requests tool '{tool}' outside parent ceiling"),
117                });
118            }
119        }
120    }
121    for (capability, ops) in &requested.capabilities {
122        match parent.capabilities.get(capability) {
123            Some(parent_ops) => {
124                for op in ops {
125                    if !parent_ops.contains(op) {
126                        violations.push(CapabilityCeilingViolation {
127                            kind: "capability".to_string(),
128                            detail: format!(
129                                "nested target requests '{capability}.{op}' outside parent ceiling"
130                            ),
131                        });
132                    }
133                }
134            }
135            None if !parent.capabilities.is_empty() => {
136                violations.push(CapabilityCeilingViolation {
137                    kind: "capability".to_string(),
138                    detail: format!(
139                        "nested target requests capability '{capability}' outside parent ceiling"
140                    ),
141                });
142            }
143            _ => {}
144        }
145    }
146    if let (Some(parent_level), Some(requested_level)) = (
147        parent.side_effect_level.as_deref(),
148        requested.side_effect_level.as_deref(),
149    ) {
150        if rank(requested_level) > rank(parent_level) {
151            violations.push(CapabilityCeilingViolation {
152                kind: "side_effect_level".to_string(),
153                detail: format!(
154                    "nested target requests side_effect_level '{requested_level}' outside parent ceiling '{parent_level}'"
155                ),
156            });
157        }
158    }
159    if !parent.workspace_roots.is_empty() {
160        for root in &requested.workspace_roots {
161            if !parent.workspace_roots.contains(root) {
162                violations.push(CapabilityCeilingViolation {
163                    kind: "workspace_root".to_string(),
164                    detail: format!(
165                        "nested target requests workspace_root '{root}' outside parent allowlist"
166                    ),
167                });
168            }
169        }
170    }
171    // A read-only root is in scope if the parent could read it — i.e. it
172    // is one of the parent's writable or read-only roots. The parent only
173    // bounds this dimension once it declares roots of either kind.
174    if !parent.workspace_roots.is_empty() || !parent.read_only_roots.is_empty() {
175        for root in &requested.read_only_roots {
176            if !parent.workspace_roots.contains(root) && !parent.read_only_roots.contains(root) {
177                violations.push(CapabilityCeilingViolation {
178                    kind: "read_only_root".to_string(),
179                    detail: format!(
180                        "nested target requests read_only_root '{root}' outside parent allowlist"
181                    ),
182                });
183            }
184        }
185    }
186    violations
187}
188
189fn rank(level: &str) -> usize {
190    match level {
191        "none" => 0,
192        "read_only" => 1,
193        "workspace_write" => 2,
194        "process_exec" => 3,
195        "network" => 4,
196        _ => 5,
197    }
198}
199
200/// Coarse capability projection for a Harn script source. We look for
201/// stdlib builtin tokens (`exec`, `shell`, `http_*`, `write_file`,
202/// `connector_call`, `llm_call`, etc.) and project an `(operation,
203/// side_effect_level)` set that the parent must allow. This is not
204/// type-aware — it intentionally over-includes rather than miss a
205/// widening attempt.
206fn scan_harn_script_ceiling(source: &str) -> CapabilityPolicy {
207    let stripped = strip_comments(source);
208    let mut capabilities: std::collections::BTreeMap<String, BTreeSet<String>> =
209        std::collections::BTreeMap::new();
210    let mut max_side_effect: Option<&'static str> = None;
211
212    for (token, capability, op, side_effect) in BUILTIN_CAPABILITIES {
213        if contains_call(&stripped, token) {
214            capabilities
215                .entry((*capability).to_string())
216                .or_default()
217                .insert((*op).to_string());
218            max_side_effect = match max_side_effect {
219                Some(current) if rank(current) >= rank(side_effect) => Some(current),
220                _ => Some(side_effect),
221            };
222        }
223    }
224
225    CapabilityPolicy {
226        tools: Vec::new(),
227        capabilities: capabilities
228            .into_iter()
229            .map(|(k, v)| (k, v.into_iter().collect()))
230            .collect(),
231        workspace_roots: Vec::new(),
232        read_only_roots: Vec::new(),
233        side_effect_level: max_side_effect.map(|level| level.to_string()),
234        recursion_limit: None,
235        tool_arg_constraints: Vec::new(),
236        tool_annotations: std::collections::BTreeMap::new(),
237        sandbox_profile: crate::orchestration::SandboxProfile::default(),
238        process_sandbox: Default::default(),
239    }
240}
241
242fn scan_burin_manifest_ceiling(manifest: &serde_json::Value) -> CapabilityPolicy {
243    if let Some(ceiling) = manifest.get("capability_ceiling") {
244        if let Ok(parsed) = serde_json::from_value::<CapabilityPolicy>(ceiling.clone()) {
245            return parsed;
246        }
247    }
248    let tools = manifest
249        .get("tools")
250        .and_then(|value| value.as_array())
251        .map(|tools| {
252            tools
253                .iter()
254                .filter_map(|tool| tool.as_str().map(str::to_string))
255                .collect::<Vec<_>>()
256        })
257        .unwrap_or_default();
258
259    CapabilityPolicy {
260        tools,
261        capabilities: std::collections::BTreeMap::new(),
262        workspace_roots: Vec::new(),
263        read_only_roots: Vec::new(),
264        side_effect_level: Some("network".to_string()),
265        recursion_limit: None,
266        tool_arg_constraints: Vec::new(),
267        tool_annotations: std::collections::BTreeMap::new(),
268        sandbox_profile: crate::orchestration::SandboxProfile::default(),
269        process_sandbox: Default::default(),
270    }
271}
272
273/// Strip line/block comments and the contents of string literals so the
274/// builtin scanner only sees actual source identifiers. Quoted text is
275/// replaced with whitespace of the same length to keep byte offsets and
276/// line numbers stable for any future diagnostics.
277fn strip_comments(source: &str) -> String {
278    let mut out = String::with_capacity(source.len());
279    let mut in_block = false;
280    let mut chars = source.chars().peekable();
281    while let Some(c) = chars.next() {
282        if in_block {
283            if c == '*' && matches!(chars.peek(), Some('/')) {
284                chars.next();
285                in_block = false;
286            }
287            continue;
288        }
289        if c == '/' {
290            match chars.peek() {
291                Some('/') => {
292                    for next in chars.by_ref() {
293                        if next == '\n' {
294                            out.push('\n');
295                            break;
296                        }
297                    }
298                    continue;
299                }
300                Some('*') => {
301                    chars.next();
302                    in_block = true;
303                    continue;
304                }
305                _ => {}
306            }
307        }
308        if c == '#' {
309            for next in chars.by_ref() {
310                if next == '\n' {
311                    out.push('\n');
312                    break;
313                }
314            }
315            continue;
316        }
317        if c == '"' || c == '\'' {
318            out.push(' ');
319            let quote = c;
320            while let Some(next) = chars.next() {
321                if next == '\\' {
322                    chars.next();
323                    out.push(' ');
324                    out.push(' ');
325                    continue;
326                }
327                if next == quote {
328                    out.push(' ');
329                    break;
330                }
331                out.push(if next == '\n' { '\n' } else { ' ' });
332            }
333            continue;
334        }
335        out.push(c);
336    }
337    out
338}
339
340fn contains_call(source: &str, token: &str) -> bool {
341    let bytes = source.as_bytes();
342    let needle = token.as_bytes();
343    if bytes.len() < needle.len() + 1 {
344        return false;
345    }
346    let mut start = 0;
347    while let Some(pos) = find_subslice(&bytes[start..], needle) {
348        let absolute = start + pos;
349        let before = if absolute == 0 {
350            None
351        } else {
352            Some(bytes[absolute - 1])
353        };
354        let after = bytes.get(absolute + needle.len()).copied();
355        let valid_before = match before {
356            None => true,
357            Some(c) => !is_identifier_byte(c),
358        };
359        let valid_after = matches!(after, Some(b'(') | Some(b' ') | Some(b'\t'))
360            || matches!(after, Some(b'\n') | Some(b'\r'));
361        if valid_before && valid_after {
362            return true;
363        }
364        start = absolute + needle.len();
365    }
366    false
367}
368
369fn find_subslice(haystack: &[u8], needle: &[u8]) -> Option<usize> {
370    if needle.is_empty() || haystack.len() < needle.len() {
371        return None;
372    }
373    haystack
374        .windows(needle.len())
375        .position(|window| window == needle)
376}
377
378fn is_identifier_byte(b: u8) -> bool {
379    b.is_ascii_alphanumeric() || b == b'_'
380}
381
382const BUILTIN_CAPABILITIES: &[(&str, &str, &str, &str)] = &[
383    ("read_file", "workspace", "read_text", "read_only"),
384    ("read_file_result", "workspace", "read_text", "read_only"),
385    ("read_file_bytes", "workspace", "read_text", "read_only"),
386    ("render", "workspace", "read_text", "read_only"),
387    ("render_prompt", "workspace", "read_text", "read_only"),
388    (
389        "render_with_provenance",
390        "workspace",
391        "read_text",
392        "read_only",
393    ),
394    ("list_dir", "workspace", "list", "read_only"),
395    ("file_exists", "workspace", "exists", "read_only"),
396    ("stat", "workspace", "exists", "read_only"),
397    ("write_file", "workspace", "write_text", "workspace_write"),
398    (
399        "write_file_bytes",
400        "workspace",
401        "write_text",
402        "workspace_write",
403    ),
404    ("append_file", "workspace", "write_text", "workspace_write"),
405    ("mkdir", "workspace", "write_text", "workspace_write"),
406    ("copy_file", "workspace", "write_text", "workspace_write"),
407    ("delete_file", "workspace", "delete", "workspace_write"),
408    ("apply_edit", "workspace", "apply_edit", "workspace_write"),
409    ("exec", "process", "exec", "process_exec"),
410    ("exec_at", "process", "exec", "process_exec"),
411    ("shell", "process", "exec", "process_exec"),
412    ("shell_at", "process", "exec", "process_exec"),
413    ("http_get", "network", "http", "network"),
414    ("http_post", "network", "http", "network"),
415    ("http_put", "network", "http", "network"),
416    ("http_patch", "network", "http", "network"),
417    ("http_delete", "network", "http", "network"),
418    ("http_request", "network", "http", "network"),
419    ("http_download", "network", "http", "network"),
420    ("connector_call", "connector", "call", "network"),
421    ("secret_get", "connector", "secret_get", "read_only"),
422    ("llm_call", "llm", "call", "network"),
423    ("llm_call_safe", "llm", "call", "network"),
424    ("llm_completion", "llm", "call", "network"),
425    ("llm_stream", "llm", "call", "network"),
426    ("agent_loop", "llm", "call", "network"),
427    ("vision_ocr", "vision", "ocr", "process_exec"),
428    ("mcp_call", "process", "exec", "process_exec"),
429    ("mcp_connect", "process", "exec", "process_exec"),
430];
431
432#[cfg(test)]
433mod tests {
434    use super::*;
435    use std::collections::BTreeMap;
436
437    fn permissive_parent() -> CapabilityPolicy {
438        let mut capabilities = BTreeMap::new();
439        capabilities.insert(
440            "workspace".to_string(),
441            vec!["read_text".to_string(), "list".to_string()],
442        );
443        capabilities.insert("connector".to_string(), vec!["call".to_string()]);
444        capabilities.insert("process".to_string(), vec!["exec".to_string()]);
445        capabilities.insert("network".to_string(), vec!["http".to_string()]);
446        capabilities.insert("llm".to_string(), vec!["call".to_string()]);
447        CapabilityPolicy {
448            tools: Vec::new(),
449            capabilities,
450            workspace_roots: Vec::new(),
451            read_only_roots: Vec::new(),
452            side_effect_level: Some("network".to_string()),
453            recursion_limit: None,
454            tool_arg_constraints: Vec::new(),
455            tool_annotations: BTreeMap::new(),
456            sandbox_profile: crate::orchestration::SandboxProfile::default(),
457            process_sandbox: Default::default(),
458        }
459    }
460
461    fn read_only_parent() -> CapabilityPolicy {
462        let mut capabilities = BTreeMap::new();
463        capabilities.insert(
464            "workspace".to_string(),
465            vec![
466                "read_text".to_string(),
467                "list".to_string(),
468                "exists".to_string(),
469            ],
470        );
471        CapabilityPolicy {
472            tools: Vec::new(),
473            capabilities,
474            workspace_roots: Vec::new(),
475            read_only_roots: Vec::new(),
476            side_effect_level: Some("read_only".to_string()),
477            recursion_limit: None,
478            tool_arg_constraints: Vec::new(),
479            tool_annotations: BTreeMap::new(),
480            sandbox_profile: crate::orchestration::SandboxProfile::default(),
481            process_sandbox: Default::default(),
482        }
483    }
484
485    #[test]
486    fn harn_script_with_only_reads_passes_under_read_only_parent() {
487        let source = r#"
488            let body = read_file("README.md")
489            let exists = file_exists("Cargo.toml")
490        "#;
491        let report = enforce_nested_invocation_ceiling(
492            &read_only_parent(),
493            &NestedInvocationTarget::HarnScript {
494                path: "test.harn",
495                source,
496            },
497        );
498        assert!(report.allowed(), "{report:#?}");
499    }
500
501    #[test]
502    fn harn_script_with_exec_is_rejected_under_read_only_parent() {
503        let source = r#"
504            let result = exec("ls", ["-la"])
505        "#;
506        let report = enforce_nested_invocation_ceiling(
507            &read_only_parent(),
508            &NestedInvocationTarget::HarnScript {
509                path: "exec.harn",
510                source,
511            },
512        );
513        assert!(!report.allowed());
514        let kinds: Vec<&str> = report.violations.iter().map(|v| v.kind.as_str()).collect();
515        assert!(kinds.contains(&"capability"));
516        assert!(kinds.contains(&"side_effect_level"));
517    }
518
519    #[test]
520    fn harn_script_with_http_is_rejected_under_read_only_parent() {
521        let source = r#"
522            http_get("https://example.com")
523        "#;
524        let report = enforce_nested_invocation_ceiling(
525            &read_only_parent(),
526            &NestedInvocationTarget::HarnScript {
527                path: "http.harn",
528                source,
529            },
530        );
531        assert!(!report.allowed());
532    }
533
534    #[test]
535    fn harn_script_with_vision_ocr_is_rejected_under_read_only_parent() {
536        let source = r#"
537            vision_ocr("receipt.png")
538        "#;
539        let report = enforce_nested_invocation_ceiling(
540            &read_only_parent(),
541            &NestedInvocationTarget::HarnScript {
542                path: "vision.harn",
543                source,
544            },
545        );
546        assert!(!report.allowed());
547        let kinds: Vec<&str> = report.violations.iter().map(|v| v.kind.as_str()).collect();
548        assert!(kinds.contains(&"capability"));
549        assert!(kinds.contains(&"side_effect_level"));
550    }
551
552    #[test]
553    fn harn_script_keyword_inside_string_does_not_trigger() {
554        let source = r#"
555            let label = "exec is not invoked here"
556            let body = read_file("README.md")
557        "#;
558        let report = enforce_nested_invocation_ceiling(
559            &read_only_parent(),
560            &NestedInvocationTarget::HarnScript {
561                path: "string.harn",
562                source,
563            },
564        );
565        assert!(
566            report.allowed(),
567            "false positive on quoted token: {report:#?}"
568        );
569    }
570
571    #[test]
572    fn harn_script_keyword_in_comment_is_ignored() {
573        let source = r#"
574            // exec("rm -rf /") is what we used to do but no longer
575            let x = read_file("README.md")
576        "#;
577        let report = enforce_nested_invocation_ceiling(
578            &read_only_parent(),
579            &NestedInvocationTarget::HarnScript {
580                path: "comments.harn",
581                source,
582            },
583        );
584        assert!(
585            report.allowed(),
586            "false positive on commented token: {report:#?}"
587        );
588    }
589
590    #[test]
591    fn workflow_bundle_with_act_auto_is_rejected_under_read_only_parent() {
592        let mut bundle = super::super::workflow_test_fixtures::pr_monitor_bundle();
593        bundle.policy.autonomy_tier = "act_auto".to_string();
594        let report = enforce_nested_invocation_ceiling(
595            &read_only_parent(),
596            &NestedInvocationTarget::WorkflowBundle(&bundle),
597        );
598        assert!(!report.allowed());
599    }
600
601    #[test]
602    fn burin_manifest_with_explicit_ceiling_is_used_directly() {
603        let manifest = serde_json::json!({
604            "id": "burin.harness.repair",
605            "capability_ceiling": {
606                "capabilities": {
607                    "workspace": ["read_text"]
608                },
609                "side_effect_level": "read_only"
610            }
611        });
612        let report = enforce_nested_invocation_ceiling(
613            &read_only_parent(),
614            &NestedInvocationTarget::BurinHarness {
615                manifest: &manifest,
616            },
617        );
618        assert!(report.allowed(), "{report:#?}");
619    }
620
621    #[test]
622    fn burin_manifest_without_ceiling_falls_back_to_network_and_is_rejected() {
623        let manifest = serde_json::json!({"id": "burin.harness.unknown"});
624        let report = enforce_nested_invocation_ceiling(
625            &read_only_parent(),
626            &NestedInvocationTarget::BurinHarness {
627                manifest: &manifest,
628            },
629        );
630        assert!(!report.allowed());
631    }
632
633    #[test]
634    fn permissive_parent_accepts_workflow_bundle() {
635        let bundle = super::super::workflow_test_fixtures::pr_monitor_bundle();
636        let report = enforce_nested_invocation_ceiling(
637            &permissive_parent(),
638            &NestedInvocationTarget::WorkflowBundle(&bundle),
639        );
640        assert!(report.allowed(), "{report:#?}");
641    }
642}
harn_vm/orchestration/nested_invocation.rs

harn_vm/orchestration/
nested_invocation.rs