Skip to main content

harn_vm/stdlib/
hitl.rs

1use crate::value::VmDictExt;
2use std::cell::RefCell;
3use std::collections::{BTreeMap, BTreeSet};
4use std::path::Path;
5use std::sync::Arc;
6use std::time::Duration as StdDuration;
7
8use serde::{Deserialize, Serialize};
9use serde_json::{json, Value as JsonValue};
10use sha2::Digest;
11use time::format_description::well_known::Rfc3339;
12use time::OffsetDateTime;
13use uuid::Uuid;
14
15use crate::event_log::{
16    active_event_log, install_default_for_base_dir, install_memory_for_current_thread, AnyEventLog,
17    EventLog, LogEvent, Topic,
18};
19use crate::runtime_limits::RuntimeLimits;
20use crate::schema::schema_expect_value;
21use crate::stdlib::host::dispatch_mock_host_call;
22use crate::stdlib::macros::{harn_builtin, BuiltinSignature, Param, VmBuiltinDef, TY_ANY, TY_DICT};
23use crate::stdlib::options::{duration_from_value, ErrorKind};
24use crate::stdlib::waitpoint::{
25    cancel_waitpoint_on, complete_waitpoint_on, create_waitpoint_on, inspect_waitpoint_on,
26    wait_on_waitpoints, WaitpointRecord, WaitpointStatus, WaitpointWaitFailure,
27    WaitpointWaitOptions,
28};
29use crate::triggers::dispatcher::current_dispatch_context;
30use crate::value::{categorized_error, ErrorCategory, VmError, VmValue};
31use crate::vm::{AsyncBuiltinCtx, Vm};
32
33const HITL_EVENT_LOG_QUEUE_DEPTH: usize = RuntimeLimits::DEFAULT.default_event_log_queue_depth;
34const HITL_APPROVAL_TIMEOUT_MS: u64 = 24 * 60 * 60 * 1000;
35const HITL_QUESTION_TIMEOUT_MS: u64 = 24 * 60 * 60 * 1000;
36
/// Event-log topic for question requests.
pub const HITL_QUESTIONS_TOPIC: &str = "hitl.questions";
/// Event-log topic for approval requests.
pub const HITL_APPROVALS_TOPIC: &str = "hitl.approvals";
/// Event-log topic for dual-control requests.
pub const HITL_DUAL_CONTROL_TOPIC: &str = "hitl.dual_control";
/// Event-log topic for escalation requests.
pub const HITL_ESCALATIONS_TOPIC: &str = "hitl.escalations";
41
/// Snapshot of the per-thread request-sequence bookkeeping.
///
/// NOTE(review): presumably `instance_key` identifies the dispatch instance
/// the counter belongs to and `next_seq` is the next sequence number to hand
/// out — confirm against `next_request_id`.
#[derive(Default)]
pub(crate) struct RequestSequenceState {
    pub(crate) instance_key: String,
    pub(crate) next_seq: u64,
}

thread_local! {
    // Starts out as the default (empty key, sequence 0) on every thread.
    static REQUEST_SEQUENCE: RefCell<RequestSequenceState> = RefCell::default();
}
51
52#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize)]
53#[serde(rename_all = "snake_case")]
54pub enum HitlRequestKind {
55    Question,
56    Approval,
57    DualControl,
58    Escalation,
59}
60
61impl HitlRequestKind {
62    pub(crate) fn as_str(self) -> &'static str {
63        match self {
64            Self::Question => "question",
65            Self::Approval => "approval",
66            Self::DualControl => "dual_control",
67            Self::Escalation => "escalation",
68        }
69    }
70
71    fn topic(self) -> &'static str {
72        match self {
73            Self::Question => HITL_QUESTIONS_TOPIC,
74            Self::Approval => HITL_APPROVALS_TOPIC,
75            Self::DualControl => HITL_DUAL_CONTROL_TOPIC,
76            Self::Escalation => HITL_ESCALATIONS_TOPIC,
77        }
78    }
79
80    fn request_event_kind(self) -> &'static str {
81        match self {
82            Self::Question => "hitl.question_asked",
83            Self::Approval => "hitl.approval_requested",
84            Self::DualControl => "hitl.dual_control_requested",
85            Self::Escalation => "hitl.escalation_issued",
86        }
87    }
88
89    pub(crate) fn from_request_id(request_id: &str) -> Option<Self> {
90        if request_id.starts_with("hitl_question_") {
91            Some(Self::Question)
92        } else if request_id.starts_with("hitl_approval_") {
93            Some(Self::Approval)
94        } else if request_id.starts_with("hitl_dual_control_") {
95            Some(Self::DualControl)
96        } else if request_id.starts_with("hitl_escalation_") {
97            Some(Self::Escalation)
98        } else {
99            None
100        }
101    }
102}
103
104#[derive(Clone, Debug, Serialize, Deserialize)]
105pub struct HitlHostResponse {
106    pub request_id: String,
107    #[serde(skip_serializing_if = "Option::is_none")]
108    pub answer: Option<JsonValue>,
109    #[serde(skip_serializing_if = "Option::is_none")]
110    pub approved: Option<bool>,
111    #[serde(skip_serializing_if = "Option::is_none")]
112    pub accepted: Option<bool>,
113    #[serde(skip_serializing_if = "Option::is_none")]
114    pub reviewer: Option<String>,
115    #[serde(skip_serializing_if = "Option::is_none")]
116    pub reason: Option<String>,
117    #[serde(skip_serializing_if = "Option::is_none")]
118    pub metadata: Option<JsonValue>,
119    #[serde(skip_serializing_if = "Option::is_none")]
120    pub responded_at: Option<String>,
121    #[serde(skip_serializing_if = "Option::is_none")]
122    pub signature: Option<String>,
123}
124
125#[derive(Clone, Debug, Serialize, Deserialize)]
126struct HitlRequestEnvelope {
127    request_id: String,
128    kind: HitlRequestKind,
129    #[serde(default)]
130    agent: String,
131    trace_id: String,
132    #[serde(skip_serializing_if = "Option::is_none")]
133    run_id: Option<String>,
134    requested_at: String,
135    payload: JsonValue,
136}
137
138#[derive(Clone, Debug, Serialize, Deserialize)]
139struct HitlTimeoutRecord {
140    request_id: String,
141    kind: HitlRequestKind,
142    trace_id: String,
143    timed_out_at: String,
144}
145
146#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, Eq)]
147pub struct ApprovalRequest {
148    pub id: String,
149    pub action: String,
150    #[serde(default)]
151    pub args: JsonValue,
152    pub principal: String,
153    pub requested_at: String,
154    #[serde(skip_serializing_if = "Option::is_none")]
155    pub deadline: Option<String>,
156    pub approvers_required: u32,
157    #[serde(default)]
158    pub evidence_refs: Vec<JsonValue>,
159    #[serde(default)]
160    pub undo_metadata: JsonValue,
161    #[serde(default)]
162    pub capabilities_requested: Vec<String>,
163}
164
165impl ApprovalRequest {
166    pub fn new(
167        id: impl Into<String>,
168        action: impl Into<String>,
169        args: JsonValue,
170        principal: impl Into<String>,
171        requested_at: impl Into<String>,
172    ) -> Self {
173        Self {
174            id: id.into(),
175            action: action.into(),
176            args,
177            principal: principal.into(),
178            requested_at: requested_at.into(),
179            deadline: None,
180            approvers_required: 1,
181            evidence_refs: Vec::new(),
182            undo_metadata: JsonValue::Null,
183            capabilities_requested: Vec::new(),
184        }
185    }
186}
187
188pub(crate) fn approval_request_for_host_permission(
189    id: impl Into<String>,
190    action: impl Into<String>,
191    args: JsonValue,
192    principal: impl Into<String>,
193    evidence_refs: Vec<JsonValue>,
194    undo_metadata: JsonValue,
195    capabilities_requested: Vec<String>,
196) -> ApprovalRequest {
197    let mut request = ApprovalRequest::new(id, action, args, principal, now_rfc3339());
198    request.evidence_refs = evidence_refs;
199    request.undo_metadata = undo_metadata;
200    request.capabilities_requested = capabilities_requested;
201    request
202}
203
/// Identifiers describing the current dispatch, as seen by HITL builtins.
#[derive(Debug, Clone)]
struct DispatchKeys {
    // NOTE(review): `instance_key` and `stable_base` are consumed outside this
    // view (presumably when deriving request ids) — confirm.
    instance_key: String,
    stable_base: String,
    /// Agent name copied into request envelopes.
    agent: String,
    /// Trace id copied into request envelopes.
    trace_id: String,
}
211
212#[derive(Clone, Debug)]
213struct AskUserOptions {
214    schema: Option<VmValue>,
215    timeout: Option<StdDuration>,
216    default: Option<VmValue>,
217}
218
219#[derive(Clone, Debug)]
220struct ApprovalOptions {
221    detail: Option<VmValue>,
222    args: Option<VmValue>,
223    quorum: u32,
224    reviewers: Vec<String>,
225    deadline: StdDuration,
226    principal: Option<String>,
227    evidence_refs: Vec<JsonValue>,
228    undo_metadata: Option<JsonValue>,
229    capabilities_requested: Vec<String>,
230}
231
232#[derive(Clone, Debug)]
233struct ApprovalProgress {
234    request_id: String,
235    reviewers: BTreeSet<String>,
236    signatures: Vec<ApprovalSignature>,
237    reason: Option<String>,
238    approved_at: Option<String>,
239}
240
241#[derive(Clone, Debug, Serialize)]
242struct ApprovalSignature {
243    reviewer: String,
244    signed_at: String,
245    signature: String,
246}
247
248#[derive(Clone, Debug)]
249enum ApprovalResolution {
250    Pending,
251    Approved(ApprovalProgress),
252    Denied(HitlHostResponse),
253}
254
255// `Completed` carries the full `WaitpointRecord`, which dominates the
256// enum's size — boxing it would force every match arm to indirect even
257// though the enum is dropped within nanoseconds of being constructed
258// (it's a local return type for the waitpoint poll loop, never stored).
259// Surfaced by the host-target compile of `harn-vm` introduced when
260// `harn-cli`'s build script gained `harn-vm` as a build-dep for the
261// AOT bytecode embedding pass (G7 / harn#2300).
262#[allow(clippy::large_enum_variant)]
263#[derive(Clone, Debug)]
264enum WaitpointOutcome {
265    Completed(WaitpointRecord),
266    Timeout,
267    Cancelled {
268        wait_id: String,
269        waitpoint_ids: Vec<String>,
270        reason: Option<String>,
271    },
272}
273
274pub(crate) fn register_hitl_builtins(vm: &mut Vm) {
275    for def in MODULE_BUILTINS {
276        vm.register_builtin_def(def);
277    }
278}
279
280pub(crate) const MODULE_BUILTINS: &[&VmBuiltinDef] = &[
281    &ASK_USER_BUILTIN_DEF,
282    &REQUEST_APPROVAL_BUILTIN_DEF,
283    &DUAL_CONTROL_BUILTIN_DEF,
284    &ESCALATE_TO_BUILTIN_DEF,
285];
286
287#[harn_builtin(
288    sig = "ask_user(prompt: string, options?: dict) -> any",
289    kind = "async",
290    category = "hitl"
291)]
292async fn ask_user_builtin(
293    ctx: crate::vm::AsyncBuiltinCtx,
294    args: Vec<VmValue>,
295) -> Result<VmValue, VmError> {
296    ask_user_impl(Some(&ctx), &args).await
297}
298
299#[harn_builtin(
300    sig_expr = BuiltinSignature::variadic("request_approval", &[Param::new("args", TY_ANY)], TY_DICT),
301    kind = "async",
302    category = "hitl"
303)]
304async fn request_approval_builtin(
305    ctx: crate::vm::AsyncBuiltinCtx,
306    args: Vec<VmValue>,
307) -> Result<VmValue, VmError> {
308    request_approval_impl(Some(&ctx), &args).await
309}
310
311#[harn_builtin(
312    sig = "dual_control(n: int, m: int, action: closure, approvers?: list) -> dict",
313    kind = "async",
314    category = "hitl"
315)]
316async fn dual_control_builtin(
317    ctx: crate::vm::AsyncBuiltinCtx,
318    args: Vec<VmValue>,
319) -> Result<VmValue, VmError> {
320    dual_control_impl(&ctx, &args).await
321}
322
323#[harn_builtin(
324    sig = "escalate_to(role: string, reason: string) -> dict",
325    kind = "async",
326    category = "hitl"
327)]
328async fn escalate_to_builtin(
329    ctx: crate::vm::AsyncBuiltinCtx,
330    args: Vec<VmValue>,
331) -> Result<VmValue, VmError> {
332    escalate_to_impl(Some(&ctx), &args).await
333}
334
335pub(crate) fn reset_hitl_state() {
336    REQUEST_SEQUENCE.with(|slot| {
337        *slot.borrow_mut() = RequestSequenceState::default();
338    });
339}
340
341pub(crate) fn take_hitl_state() -> RequestSequenceState {
342    REQUEST_SEQUENCE.with(|slot| std::mem::take(&mut *slot.borrow_mut()))
343}
344
345pub(crate) fn restore_hitl_state(state: RequestSequenceState) {
346    REQUEST_SEQUENCE.with(|slot| {
347        *slot.borrow_mut() = state;
348    });
349}
350
351pub async fn append_hitl_response(
352    base_dir: Option<&Path>,
353    mut response: HitlHostResponse,
354) -> Result<u64, String> {
355    let kind = HitlRequestKind::from_request_id(&response.request_id)
356        .ok_or_else(|| format!("unknown HITL request id '{}'", response.request_id))?;
357    if response.responded_at.is_none() {
358        response.responded_at = Some(now_rfc3339());
359    }
360    let log = ensure_hitl_event_log_for(base_dir)?;
361    let headers = response_headers(&response.request_id);
362    let topic = Topic::new(kind.topic()).map_err(|error| error.to_string())?;
363    let event_id = log
364        .append(
365            &topic,
366            LogEvent::new(
367                match kind {
368                    HitlRequestKind::Escalation => "hitl.escalation_accepted",
369                    _ => "hitl.response_received",
370                },
371                serde_json::to_value(&response).map_err(|error| error.to_string())?,
372            )
373            .with_headers(headers),
374        )
375        .await
376        .map_err(|error| error.to_string())?;
377    finalize_hitl_response(&log, kind, &response).await?;
378    Ok(event_id)
379}
380
381pub async fn append_approval_request_on(
382    log: &Arc<AnyEventLog>,
383    agent: impl Into<String>,
384    trace_id: impl Into<String>,
385    action: impl Into<String>,
386    detail: JsonValue,
387    reviewers: Vec<String>,
388) -> Result<String, VmError> {
389    let request_id = next_request_id(HitlRequestKind::Approval, current_dispatch_keys().as_ref());
390    let trace_id = trace_id.into();
391    let agent = agent.into();
392    let requested_at_time = OffsetDateTime::now_utc();
393    let requested_at = format_rfc3339(requested_at_time);
394    let mut approval_request = ApprovalRequest::new(
395        request_id.clone(),
396        action.into(),
397        detail.clone(),
398        agent.clone(),
399        requested_at.clone(),
400    );
401    approval_request.deadline = deadline_after(
402        requested_at_time,
403        StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS),
404    );
405    approval_request.approvers_required = 1;
406    let approval_request_json = serde_json::to_value(&approval_request)
407        .map_err(|error| VmError::Runtime(error.to_string()))?;
408    let request = HitlRequestEnvelope {
409        request_id: request_id.clone(),
410        kind: HitlRequestKind::Approval,
411        agent,
412        trace_id: trace_id.clone(),
413        run_id: None,
414        requested_at: requested_at.clone(),
415        payload: json!({
416            "approval_request": approval_request_json,
417            "id": approval_request.id,
418            "action": approval_request.action,
419            "args": approval_request.args,
420            "principal": approval_request.principal,
421            "requested_at": requested_at,
422            "deadline": approval_request.deadline,
423            "approvers_required": approval_request.approvers_required,
424            "evidence_refs": approval_request.evidence_refs,
425            "undo_metadata": approval_request.undo_metadata,
426            "capabilities_requested": approval_request.capabilities_requested,
427            "detail": detail,
428            "quorum": 1,
429            "reviewers": reviewers,
430            "deadline_ms": HITL_APPROVAL_TIMEOUT_MS,
431        }),
432    };
433    create_request_waitpoint(log, &request).await?;
434    append_request(log, &request).await?;
435    maybe_notify_host(None, &request);
436    Ok(request_id)
437}
438
439async fn ask_user_impl(
440    ctx: Option<&AsyncBuiltinCtx>,
441    args: &[VmValue],
442) -> Result<VmValue, VmError> {
443    let prompt = required_string_arg(args, 0, "ask_user")?;
444    let options = parse_ask_user_options(args.get(1))?;
445    let keys = current_dispatch_keys();
446    let request_id = next_request_id(HitlRequestKind::Question, keys.as_ref());
447    let trace_id = keys
448        .as_ref()
449        .map(|keys| keys.trace_id.clone())
450        .unwrap_or_else(new_trace_id);
451    let log = ensure_hitl_event_log();
452    let request = HitlRequestEnvelope {
453        request_id: request_id.clone(),
454        kind: HitlRequestKind::Question,
455        agent: keys
456            .as_ref()
457            .map(|keys| keys.agent.clone())
458            .unwrap_or_default(),
459        trace_id: trace_id.clone(),
460        run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
461        requested_at: now_rfc3339(),
462        payload: json!({
463            "prompt": prompt,
464            "schema": options.schema.as_ref().map(crate::llm::vm_value_to_json),
465            "default": options.default.as_ref().map(crate::llm::vm_value_to_json),
466            "timeout_ms": options.timeout.map(|timeout| timeout.as_millis() as u64),
467        }),
468    };
469    create_request_waitpoint(&log, &request).await?;
470    append_request(&log, &request).await?;
471    maybe_notify_host(ctx, &request);
472    emit_hitl_requested(&request);
473    maybe_apply_mock_response(HitlRequestKind::Question, &request_id, &request.payload).await?;
474
475    match wait_for_request_waitpoint_with_events(
476        &request_id,
477        HitlRequestKind::Question,
478        options.timeout,
479    )
480    .await?
481    {
482        WaitpointOutcome::Completed(record) => {
483            let answer = record
484                .value
485                .as_ref()
486                .map(crate::stdlib::json_to_vm_value)
487                .unwrap_or(VmValue::Nil);
488            if let Some(schema) = options.schema.as_ref() {
489                return schema_expect_value(&answer, schema, true);
490            }
491            if let Some(default) = options.default.as_ref() {
492                return Ok(coerce_like_default(&answer, default));
493            }
494            Ok(answer)
495        }
496        WaitpointOutcome::Timeout => {
497            append_timeout_once(&log, HitlRequestKind::Question, &request_id, &trace_id).await?;
498            if let Some(default) = options.default {
499                return Ok(default);
500            }
501            Err(timeout_error(&request_id, HitlRequestKind::Question))
502        }
503        WaitpointOutcome::Cancelled {
504            wait_id,
505            waitpoint_ids,
506            reason,
507        } => Err(hitl_cancelled_error(
508            &request_id,
509            HitlRequestKind::Question,
510            &wait_id,
511            &waitpoint_ids,
512            reason,
513        )),
514    }
515}
516
517async fn request_approval_impl(
518    ctx: Option<&AsyncBuiltinCtx>,
519    args: &[VmValue],
520) -> Result<VmValue, VmError> {
521    let action = required_string_arg(args, 0, "request_approval")?;
522    let options = parse_approval_options(args.get(1), "request_approval")?;
523    let keys = current_dispatch_keys();
524    let request_id = next_request_id(HitlRequestKind::Approval, keys.as_ref());
525    let trace_id = keys
526        .as_ref()
527        .map(|keys| keys.trace_id.clone())
528        .unwrap_or_else(new_trace_id);
529    let agent = keys
530        .as_ref()
531        .map(|keys| keys.agent.clone())
532        .unwrap_or_default();
533    let requested_at_time = OffsetDateTime::now_utc();
534    let requested_at = format_rfc3339(requested_at_time);
535    let principal = options.principal.clone().unwrap_or_else(|| agent.clone());
536    let approval_args = options
537        .args
538        .as_ref()
539        .or(options.detail.as_ref())
540        .map(crate::llm::vm_value_to_json)
541        .unwrap_or(JsonValue::Null);
542    let mut approval_request = ApprovalRequest::new(
543        request_id.clone(),
544        action.clone(),
545        approval_args,
546        principal,
547        requested_at.clone(),
548    );
549    approval_request.deadline = deadline_after(requested_at_time, options.deadline);
550    approval_request.approvers_required = options.quorum;
551    approval_request.evidence_refs = options.evidence_refs.clone();
552    approval_request.undo_metadata = options
553        .undo_metadata
554        .clone()
555        .or_else(|| {
556            crate::orchestration::current_mutation_session()
557                .and_then(|session| serde_json::to_value(session).ok())
558        })
559        .unwrap_or(JsonValue::Null);
560    approval_request.capabilities_requested = options.capabilities_requested.clone();
561    let approval_request_json = serde_json::to_value(&approval_request)
562        .map_err(|error| VmError::Runtime(error.to_string()))?;
563    let log = ensure_hitl_event_log();
564    let request = HitlRequestEnvelope {
565        request_id: request_id.clone(),
566        kind: HitlRequestKind::Approval,
567        agent,
568        trace_id: trace_id.clone(),
569        run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
570        requested_at: requested_at.clone(),
571        payload: json!({
572            "approval_request": approval_request_json,
573            "id": approval_request.id,
574            "action": action,
575            "args": approval_request.args,
576            "principal": approval_request.principal,
577            "requested_at": requested_at,
578            "deadline": approval_request.deadline,
579            "approvers_required": approval_request.approvers_required,
580            "evidence_refs": approval_request.evidence_refs,
581            "undo_metadata": approval_request.undo_metadata,
582            "capabilities_requested": approval_request.capabilities_requested,
583            "detail": options.detail.as_ref().map(crate::llm::vm_value_to_json),
584            "quorum": options.quorum,
585            "reviewers": options.reviewers,
586            "deadline_ms": options.deadline.as_millis() as u64,
587        }),
588    };
589    create_request_waitpoint(&log, &request).await?;
590    append_request(&log, &request).await?;
591    maybe_notify_host(ctx, &request);
592    emit_hitl_requested(&request);
593    maybe_apply_mock_response(HitlRequestKind::Approval, &request_id, &request.payload).await?;
594
595    match wait_for_request_waitpoint_with_events(
596        &request_id,
597        HitlRequestKind::Approval,
598        Some(options.deadline),
599    )
600    .await?
601    {
602        WaitpointOutcome::Completed(record) => {
603            approval_record_from_waitpoint(&record, "request_approval")
604        }
605        WaitpointOutcome::Timeout => {
606            append_timeout_once(&log, HitlRequestKind::Approval, &request_id, &trace_id).await?;
607            Err(timeout_error(&request_id, HitlRequestKind::Approval))
608        }
609        WaitpointOutcome::Cancelled { .. } => {
610            Err(approval_wait_error(&log, HitlRequestKind::Approval, &request_id).await)
611        }
612    }
613}
614
615pub(crate) async fn request_approval_for_side_effect(
616    action: &str,
617    detail: JsonValue,
618    principal: String,
619    reviewers: Vec<String>,
620    capabilities_requested: Vec<String>,
621) -> Result<VmValue, VmError> {
622    let mut options = crate::value::DictMap::new();
623    options.insert("args".to_string(), crate::stdlib::json_to_vm_value(&detail));
624    options.insert(
625        "detail".to_string(),
626        crate::stdlib::json_to_vm_value(&detail),
627    );
628    options.put_str("principal", principal);
629    options.insert(
630        "reviewers".to_string(),
631        VmValue::List(std::sync::Arc::new(
632            reviewers
633                .into_iter()
634                .map(|reviewer| VmValue::String(std::sync::Arc::from(reviewer)))
635                .collect(),
636        )),
637    );
638    options.insert(
639        "capabilities_requested".to_string(),
640        VmValue::List(std::sync::Arc::new(
641            capabilities_requested
642                .into_iter()
643                .map(|capability| VmValue::String(std::sync::Arc::from(capability)))
644                .collect(),
645        )),
646    );
647    let args = vec![
648        VmValue::String(std::sync::Arc::from(action.to_string())),
649        VmValue::dict(options),
650    ];
651    request_approval_impl(None, &args).await
652}
653
654async fn dual_control_impl(ctx: &AsyncBuiltinCtx, args: &[VmValue]) -> Result<VmValue, VmError> {
655    let n = required_positive_int_arg(args, 0, "dual_control")?;
656    let m = required_positive_int_arg(args, 1, "dual_control")?;
657    if n > m {
658        return Err(VmError::Runtime(
659            "dual_control: n must be less than or equal to m".to_string(),
660        ));
661    }
662    let action = args
663        .get(2)
664        .and_then(|value| match value {
665            VmValue::Closure(closure) => Some(closure.clone()),
666            _ => None,
667        })
668        .ok_or_else(|| VmError::Runtime("dual_control: action must be a closure".to_string()))?;
669    let approvers = optional_string_list(args.get(3), "dual_control")?;
670    if !approvers.is_empty() && approvers.len() < m as usize {
671        return Err(VmError::Runtime(format!(
672            "dual_control: expected at least {m} approvers, got {}",
673            approvers.len()
674        )));
675    }
676
677    let keys = current_dispatch_keys();
678    let request_id = next_request_id(HitlRequestKind::DualControl, keys.as_ref());
679    let trace_id = keys
680        .as_ref()
681        .map(|keys| keys.trace_id.clone())
682        .unwrap_or_else(new_trace_id);
683    let action_name = if action.func.name.is_empty() {
684        "anonymous".to_string()
685    } else {
686        action.func.name.clone()
687    };
688    let agent = keys
689        .as_ref()
690        .map(|keys| keys.agent.clone())
691        .unwrap_or_default();
692    let requested_at_time = OffsetDateTime::now_utc();
693    let requested_at = format_rfc3339(requested_at_time);
694    let mut approval_request = ApprovalRequest::new(
695        request_id.clone(),
696        action_name.clone(),
697        json!({
698            "n": n,
699            "m": m,
700            "approvers": approvers.clone(),
701        }),
702        agent.clone(),
703        requested_at.clone(),
704    );
705    approval_request.deadline = deadline_after(
706        requested_at_time,
707        StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS),
708    );
709    approval_request.approvers_required = n as u32;
710    approval_request.undo_metadata = crate::orchestration::current_mutation_session()
711        .and_then(|session| serde_json::to_value(session).ok())
712        .unwrap_or(JsonValue::Null);
713    let approval_request_json = serde_json::to_value(&approval_request)
714        .map_err(|error| VmError::Runtime(error.to_string()))?;
715    let log = ensure_hitl_event_log();
716    let request = HitlRequestEnvelope {
717        request_id: request_id.clone(),
718        kind: HitlRequestKind::DualControl,
719        agent,
720        trace_id: trace_id.clone(),
721        run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
722        requested_at: requested_at.clone(),
723        payload: json!({
724            "approval_request": approval_request_json,
725            "id": approval_request.id,
726            "args": approval_request.args,
727            "principal": approval_request.principal,
728            "requested_at": requested_at,
729            "deadline": approval_request.deadline,
730            "approvers_required": approval_request.approvers_required,
731            "evidence_refs": approval_request.evidence_refs,
732            "undo_metadata": approval_request.undo_metadata,
733            "capabilities_requested": approval_request.capabilities_requested,
734            "n": n,
735            "m": m,
736            "action": action_name,
737            "approvers": approvers,
738            "deadline_ms": HITL_APPROVAL_TIMEOUT_MS,
739        }),
740    };
741    create_request_waitpoint(&log, &request).await?;
742    append_request(&log, &request).await?;
743    maybe_notify_host(Some(ctx), &request);
744    emit_hitl_requested(&request);
745    maybe_apply_mock_response(HitlRequestKind::DualControl, &request_id, &request.payload).await?;
746
747    match wait_for_request_waitpoint_with_events(
748        &request_id,
749        HitlRequestKind::DualControl,
750        Some(StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS)),
751    )
752    .await?
753    {
754        WaitpointOutcome::Completed(record) => {
755            let _ = approval_record_from_waitpoint(&record, "dual_control")?;
756            let mut vm = ctx.child_vm();
757            let result = vm.call_closure_pub(&action, &[]).await?;
758            ctx.forward_output(&vm.take_output());
759
760            append_named_event(
761                &log,
762                HitlRequestKind::DualControl,
763                "hitl.dual_control_executed",
764                &request_id,
765                &trace_id,
766                json!({
767                    "request_id": request_id,
768                    "result": crate::llm::vm_value_to_json(&result),
769                }),
770            )
771            .await?;
772
773            Ok(result)
774        }
775        WaitpointOutcome::Timeout => {
776            append_timeout_once(&log, HitlRequestKind::DualControl, &request_id, &trace_id).await?;
777            Err(timeout_error(&request_id, HitlRequestKind::DualControl))
778        }
779        WaitpointOutcome::Cancelled { .. } => {
780            Err(approval_wait_error(&log, HitlRequestKind::DualControl, &request_id).await)
781        }
782    }
783}
784
785async fn escalate_to_impl(
786    ctx: Option<&AsyncBuiltinCtx>,
787    args: &[VmValue],
788) -> Result<VmValue, VmError> {
789    let role = required_string_arg(args, 0, "escalate_to")?;
790    let reason = required_string_arg(args, 1, "escalate_to")?;
791    let keys = current_dispatch_keys();
792    let request_id = next_request_id(HitlRequestKind::Escalation, keys.as_ref());
793    let trace_id = keys
794        .as_ref()
795        .map(|keys| keys.trace_id.clone())
796        .unwrap_or_else(new_trace_id);
797    let log = ensure_hitl_event_log();
798    let request = HitlRequestEnvelope {
799        request_id: request_id.clone(),
800        kind: HitlRequestKind::Escalation,
801        agent: keys
802            .as_ref()
803            .map(|keys| keys.agent.clone())
804            .unwrap_or_default(),
805        trace_id: trace_id.clone(),
806        run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
807        requested_at: now_rfc3339(),
808        payload: json!({
809            "role": role,
810            "reason": reason,
811            "capability_policy": escalation_capability_policy(),
812        }),
813    };
814    create_request_waitpoint(&log, &request).await?;
815    append_request(&log, &request).await?;
816    maybe_notify_host(ctx, &request);
817    emit_hitl_requested(&request);
818    maybe_apply_mock_response(HitlRequestKind::Escalation, &request_id, &request.payload).await?;
819
820    match wait_for_request_waitpoint_with_events(&request_id, HitlRequestKind::Escalation, None)
821        .await?
822    {
823        WaitpointOutcome::Completed(record) => {
824            let accepted_at = record.completed_at.clone();
825            let reviewer = record.completed_by.clone();
826            let accepted = record
827                .value
828                .as_ref()
829                .and_then(|value| value.get("accepted"))
830                .and_then(JsonValue::as_bool)
831                .unwrap_or(true);
832            Ok(crate::stdlib::json_to_vm_value(&json!({
833                "request_id": request_id,
834                "role": role,
835                "reason": reason,
836                "trace_id": trace_id,
837                "status": if accepted { "accepted" } else { "pending" },
838                "accepted_at": accepted_at,
839                "reviewer": reviewer,
840            })))
841        }
842        WaitpointOutcome::Timeout => Err(timeout_error(&request_id, HitlRequestKind::Escalation)),
843        WaitpointOutcome::Cancelled {
844            wait_id,
845            waitpoint_ids,
846            reason,
847        } => Err(hitl_cancelled_error(
848            &request_id,
849            HitlRequestKind::Escalation,
850            &wait_id,
851            &waitpoint_ids,
852            reason,
853        )),
854    }
855}
856
857async fn create_request_waitpoint(
858    log: &Arc<AnyEventLog>,
859    request: &HitlRequestEnvelope,
860) -> Result<(), VmError> {
861    create_waitpoint_on(
862        log,
863        Some(request.request_id.clone()),
864        Some(json!({
865            "kind": request.kind.as_str(),
866            "agent": request.agent.clone(),
867            "trace_id": request.trace_id.clone(),
868            "requested_at": request.requested_at.clone(),
869            "payload": request.payload.clone(),
870        })),
871    )
872    .await?;
873    Ok(())
874}
875
876async fn wait_for_request_waitpoint(
877    request_id: &str,
878    timeout: Option<StdDuration>,
879) -> Result<WaitpointOutcome, VmError> {
880    match wait_on_waitpoints(
881        vec![request_id.to_string()],
882        WaitpointWaitOptions { timeout },
883    )
884    .await
885    {
886        Ok(records) => Ok(WaitpointOutcome::Completed(
887            records
888                .into_iter()
889                .next()
890                .expect("single waitpoint wait result"),
891        )),
892        Err(WaitpointWaitFailure::Timeout { .. }) => Ok(WaitpointOutcome::Timeout),
893        Err(WaitpointWaitFailure::Cancelled {
894            wait_id,
895            waitpoint_ids,
896            reason,
897        }) => Ok(WaitpointOutcome::Cancelled {
898            wait_id,
899            waitpoint_ids,
900            reason,
901        }),
902        Err(WaitpointWaitFailure::Vm(error)) => {
903            if let Some(outcome) = waitpoint_outcome_from_vm_error(&error) {
904                return Ok(outcome);
905            }
906            Err(error)
907        }
908    }
909}
910
911fn waitpoint_outcome_from_vm_error(error: &VmError) -> Option<WaitpointOutcome> {
912    let VmError::Thrown(VmValue::Dict(dict)) = error else {
913        return None;
914    };
915    let name = dict.get("name").and_then(vm_string)?;
916    match name {
917        "WaitpointTimeoutError" => Some(WaitpointOutcome::Timeout),
918        "WaitpointCancelledError" => Some(WaitpointOutcome::Cancelled {
919            wait_id: dict
920                .get("wait_id")
921                .and_then(vm_string)
922                .unwrap_or_default()
923                .to_string(),
924            waitpoint_ids: dict
925                .get("waitpoint_ids")
926                .and_then(vm_string_list)
927                .unwrap_or_default(),
928            reason: dict
929                .get("reason")
930                .and_then(vm_string)
931                .map(ToString::to_string),
932        }),
933        _ => None,
934    }
935}
936
937async fn finalize_hitl_response(
938    log: &Arc<AnyEventLog>,
939    kind: HitlRequestKind,
940    response: &HitlHostResponse,
941) -> Result<(), String> {
942    match kind {
943        HitlRequestKind::Question => {
944            if waitpoint_is_terminal(log, &response.request_id).await? {
945                return Ok(());
946            }
947            complete_waitpoint_on(
948                log,
949                &response.request_id,
950                response.answer.clone(),
951                response.reviewer.clone(),
952                response.reason.clone(),
953                response.metadata.clone(),
954            )
955            .await
956            .map(|_| ())
957            .map_err(|error| error.to_string())
958        }
959        HitlRequestKind::Escalation => {
960            if !response.accepted.unwrap_or(false)
961                || waitpoint_is_terminal(log, &response.request_id).await?
962            {
963                return Ok(());
964            }
965            complete_waitpoint_on(
966                log,
967                &response.request_id,
968                Some(json!({
969                    "accepted": true,
970                    "reviewer": response.reviewer,
971                    "reason": response.reason,
972                    "responded_at": response.responded_at,
973                })),
974                response.reviewer.clone(),
975                response.reason.clone(),
976                response.metadata.clone(),
977            )
978            .await
979            .map(|_| ())
980            .map_err(|error| error.to_string())
981        }
982        HitlRequestKind::Approval | HitlRequestKind::DualControl => {
983            if waitpoint_is_terminal(log, &response.request_id).await? {
984                return Ok(());
985            }
986            let request = load_request_envelope(log, kind, &response.request_id)
987                .await
988                .map_err(|error| error.to_string())?;
989            match resolve_approval_state(log, kind, &request)
990                .await
991                .map_err(|error| error.to_string())?
992            {
993                ApprovalResolution::Pending => Ok(()),
994                ApprovalResolution::Approved(progress) => {
995                    let record = approval_record_json(&progress);
996                    append_named_event(
997                        log,
998                        kind,
999                        approved_event_kind(kind),
1000                        &request.request_id,
1001                        &request.trace_id,
1002                        json!({
1003                            "request_id": request.request_id.clone(),
1004                            "record": record.clone(),
1005                        }),
1006                    )
1007                    .await
1008                    .map_err(|error| error.to_string())?;
1009                    complete_waitpoint_on(
1010                        log,
1011                        &request.request_id,
1012                        Some(record),
1013                        response.reviewer.clone(),
1014                        progress.reason.clone(),
1015                        response.metadata.clone(),
1016                    )
1017                    .await
1018                    .map(|_| ())
1019                    .map_err(|error| error.to_string())
1020                }
1021                ApprovalResolution::Denied(denied) => {
1022                    append_named_event(
1023                        log,
1024                        kind,
1025                        denied_event_kind(kind),
1026                        &request.request_id,
1027                        &request.trace_id,
1028                        json!({
1029                            "request_id": request.request_id.clone(),
1030                            "reviewer": denied.reviewer.clone(),
1031                            "reason": denied.reason.clone(),
1032                        }),
1033                    )
1034                    .await
1035                    .map_err(|error| error.to_string())?;
1036                    cancel_waitpoint_on(
1037                        log,
1038                        &request.request_id,
1039                        denied.reviewer.clone(),
1040                        denied.reason.clone(),
1041                        denied.metadata.clone(),
1042                    )
1043                    .await
1044                    .map(|_| ())
1045                    .map_err(|error| error.to_string())
1046                }
1047            }
1048        }
1049    }
1050}
1051
1052async fn waitpoint_is_terminal(log: &Arc<AnyEventLog>, request_id: &str) -> Result<bool, String> {
1053    Ok(inspect_waitpoint_on(log, request_id)
1054        .await
1055        .map_err(|error| error.to_string())?
1056        .is_some_and(|record| record.status != WaitpointStatus::Open))
1057}
1058
1059async fn load_request_envelope(
1060    log: &Arc<AnyEventLog>,
1061    kind: HitlRequestKind,
1062    request_id: &str,
1063) -> Result<HitlRequestEnvelope, VmError> {
1064    let topic = topic(kind)?;
1065    let events = log
1066        .read_range(&topic, None, usize::MAX)
1067        .await
1068        .map_err(log_error)?;
1069    events
1070        .into_iter()
1071        .filter(|(_, event)| event.kind == kind.request_event_kind())
1072        .find_map(|(_, event)| {
1073            if !event_matches_request(&event, request_id) {
1074                return None;
1075            }
1076            serde_json::from_value::<HitlRequestEnvelope>(event.payload).ok()
1077        })
1078        .ok_or_else(|| {
1079            VmError::Runtime(format!("missing HITL request envelope for '{request_id}'"))
1080        })
1081}
1082
1083async fn resolve_approval_state(
1084    log: &Arc<AnyEventLog>,
1085    kind: HitlRequestKind,
1086    request: &HitlRequestEnvelope,
1087) -> Result<ApprovalResolution, VmError> {
1088    let quorum = approval_quorum_from_request(kind, request)?;
1089    let allowed_reviewers = approval_reviewers_from_request(kind, request)
1090        .into_iter()
1091        .collect::<BTreeSet<_>>();
1092    let mut progress = ApprovalProgress {
1093        request_id: request.request_id.clone(),
1094        reviewers: BTreeSet::new(),
1095        signatures: Vec::new(),
1096        reason: None,
1097        approved_at: None,
1098    };
1099    let topic = topic(kind)?;
1100    let events = log
1101        .read_range(&topic, None, usize::MAX)
1102        .await
1103        .map_err(log_error)?;
1104    for (_, event) in events {
1105        if !event_matches_request(&event, &request.request_id)
1106            || event.kind != "hitl.response_received"
1107        {
1108            continue;
1109        }
1110        let response: HitlHostResponse = serde_json::from_value(event.payload)
1111            .map_err(|error| VmError::Runtime(error.to_string()))?;
1112        if let Some(reviewer) = response.reviewer.as_deref() {
1113            if !allowed_reviewers.is_empty() && !allowed_reviewers.contains(reviewer) {
1114                continue;
1115            }
1116            if progress.reviewers.contains(reviewer) {
1117                continue;
1118            }
1119        }
1120        if response.approved.unwrap_or(false) {
1121            if let Some(reviewer) = response.reviewer.clone() {
1122                let signed_at = response.responded_at.clone().unwrap_or_else(now_rfc3339);
1123                progress.reviewers.insert(reviewer.clone());
1124                progress.signatures.push(ApprovalSignature {
1125                    reviewer: reviewer.clone(),
1126                    signed_at: signed_at.clone(),
1127                    signature: response.signature.clone().unwrap_or_else(|| {
1128                        approval_receipt_signature(
1129                            &request.request_id,
1130                            &reviewer,
1131                            &signed_at,
1132                            true,
1133                            response.reason.as_deref(),
1134                        )
1135                    }),
1136                });
1137            }
1138            progress.reason = response.reason.clone();
1139            progress.approved_at = response.responded_at.clone();
1140            if progress.reviewers.len() as u32 >= quorum {
1141                return Ok(ApprovalResolution::Approved(progress));
1142            }
1143            continue;
1144        }
1145        return Ok(ApprovalResolution::Denied(response));
1146    }
1147    Ok(ApprovalResolution::Pending)
1148}
1149
1150fn approval_quorum_from_request(
1151    kind: HitlRequestKind,
1152    request: &HitlRequestEnvelope,
1153) -> Result<u32, VmError> {
1154    let key = match kind {
1155        HitlRequestKind::DualControl => "n",
1156        _ => "quorum",
1157    };
1158    let quorum = request
1159        .payload
1160        .get(key)
1161        .or_else(|| request.payload.get("approvers_required"))
1162        .or_else(|| {
1163            request
1164                .payload
1165                .get("approval_request")
1166                .and_then(|approval| approval.get("approvers_required"))
1167        })
1168        .and_then(JsonValue::as_u64)
1169        .unwrap_or(1);
1170    u32::try_from(quorum).map_err(|_| {
1171        VmError::Runtime(format!(
1172            "invalid quorum in HITL request '{}'",
1173            request.request_id
1174        ))
1175    })
1176}
1177
1178fn approval_reviewers_from_request(
1179    kind: HitlRequestKind,
1180    request: &HitlRequestEnvelope,
1181) -> Vec<String> {
1182    let key = match kind {
1183        HitlRequestKind::DualControl => "approvers",
1184        _ => "reviewers",
1185    };
1186    request
1187        .payload
1188        .get(key)
1189        .or_else(|| {
1190            request
1191                .payload
1192                .get("approval_request")
1193                .and_then(|approval| approval.get("reviewers"))
1194        })
1195        .and_then(JsonValue::as_array)
1196        .map(|values| {
1197            values
1198                .iter()
1199                .filter_map(JsonValue::as_str)
1200                .map(str::to_string)
1201                .collect()
1202        })
1203        .unwrap_or_default()
1204}
1205
1206fn approval_record_json(progress: &ApprovalProgress) -> JsonValue {
1207    json!({
1208        "request_id": progress.request_id.clone(),
1209        "approved": true,
1210        "reviewers": progress.reviewers.iter().cloned().collect::<Vec<_>>(),
1211        "approved_at": progress.approved_at.clone().unwrap_or_else(now_rfc3339),
1212        "reason": progress.reason,
1213        "signatures": progress.signatures,
1214    })
1215}
1216
1217fn approval_receipt_signature(
1218    request_id: &str,
1219    reviewer: &str,
1220    signed_at: &str,
1221    approved: bool,
1222    reason: Option<&str>,
1223) -> String {
1224    let material = format!(
1225        "harn-hitl-approval-v1\nrequest_id:{request_id}\nreviewer:{reviewer}\nsigned_at:{signed_at}\napproved:{approved}\nreason:{}\n",
1226        reason.unwrap_or("")
1227    );
1228    let hash = sha2::Sha256::digest(material.as_bytes());
1229    let hex: String = hash.iter().map(|byte| format!("{byte:02x}")).collect();
1230    format!("sha256:{hex}")
1231}
1232
1233fn approval_record_from_waitpoint(
1234    record: &WaitpointRecord,
1235    builtin: &str,
1236) -> Result<VmValue, VmError> {
1237    record
1238        .value
1239        .as_ref()
1240        .map(crate::stdlib::json_to_vm_value)
1241        .ok_or_else(|| VmError::Runtime(format!("{builtin}: missing approval record")))
1242}
1243
1244async fn approval_wait_error(
1245    log: &Arc<AnyEventLog>,
1246    kind: HitlRequestKind,
1247    request_id: &str,
1248) -> VmError {
1249    if let Ok(Some(record)) = inspect_waitpoint_on(log, request_id).await {
1250        if record.status == WaitpointStatus::Cancelled
1251            && record.reason.as_deref() != Some("upstream_cancelled")
1252        {
1253            return approval_denied_error(
1254                request_id,
1255                HitlHostResponse {
1256                    request_id: request_id.to_string(),
1257                    answer: None,
1258                    approved: Some(false),
1259                    accepted: None,
1260                    reviewer: record.cancelled_by.clone(),
1261                    reason: record.reason.clone(),
1262                    metadata: record.metadata.clone(),
1263                    responded_at: record.cancelled_at,
1264                    signature: None,
1265                },
1266            );
1267        }
1268        if record.status == WaitpointStatus::Cancelled {
1269            return hitl_cancelled_error(
1270                request_id,
1271                kind,
1272                "",
1273                &[request_id.to_string()],
1274                record.reason,
1275            );
1276        }
1277    }
1278    hitl_cancelled_error(
1279        request_id,
1280        kind,
1281        "",
1282        &[request_id.to_string()],
1283        Some("upstream_cancelled".to_string()),
1284    )
1285}
1286
1287async fn append_timeout_once(
1288    log: &Arc<AnyEventLog>,
1289    kind: HitlRequestKind,
1290    request_id: &str,
1291    trace_id: &str,
1292) -> Result<(), VmError> {
1293    if hitl_event_exists(log, kind, request_id, "hitl.timeout").await? {
1294        return Ok(());
1295    }
1296    append_timeout(log, kind, request_id, trace_id).await
1297}
1298
1299async fn hitl_event_exists(
1300    log: &Arc<AnyEventLog>,
1301    kind: HitlRequestKind,
1302    request_id: &str,
1303    event_kind: &str,
1304) -> Result<bool, VmError> {
1305    let topic = topic(kind)?;
1306    let events = log
1307        .read_range(&topic, None, usize::MAX)
1308        .await
1309        .map_err(log_error)?;
1310    Ok(events
1311        .into_iter()
1312        .any(|(_, event)| event.kind == event_kind && event_matches_request(&event, request_id)))
1313}
1314
1315fn approved_event_kind(kind: HitlRequestKind) -> &'static str {
1316    match kind {
1317        HitlRequestKind::DualControl => "hitl.dual_control_approved",
1318        _ => "hitl.approval_approved",
1319    }
1320}
1321
1322fn denied_event_kind(kind: HitlRequestKind) -> &'static str {
1323    match kind {
1324        HitlRequestKind::DualControl => "hitl.dual_control_denied",
1325        _ => "hitl.approval_denied",
1326    }
1327}
1328
1329async fn append_request(
1330    log: &Arc<AnyEventLog>,
1331    request: &HitlRequestEnvelope,
1332) -> Result<(), VmError> {
1333    let topic = topic(request.kind)?;
1334    log.append(
1335        &topic,
1336        LogEvent::new(
1337            request.kind.request_event_kind(),
1338            serde_json::to_value(request).map_err(|error| VmError::Runtime(error.to_string()))?,
1339        )
1340        .with_headers(request_headers(request)),
1341    )
1342    .await
1343    .map(|_| ())
1344    .map_err(log_error)
1345}
1346
1347async fn append_named_event(
1348    log: &Arc<AnyEventLog>,
1349    kind: HitlRequestKind,
1350    event_kind: &str,
1351    request_id: &str,
1352    trace_id: &str,
1353    payload: JsonValue,
1354) -> Result<(), VmError> {
1355    let topic = topic(kind)?;
1356    let headers = headers_with_trace(request_id, trace_id);
1357    log.append(
1358        &topic,
1359        LogEvent::new(event_kind, payload).with_headers(headers),
1360    )
1361    .await
1362    .map(|_| ())
1363    .map_err(log_error)
1364}
1365
1366async fn append_timeout(
1367    log: &Arc<AnyEventLog>,
1368    kind: HitlRequestKind,
1369    request_id: &str,
1370    trace_id: &str,
1371) -> Result<(), VmError> {
1372    append_named_event(
1373        log,
1374        kind,
1375        "hitl.timeout",
1376        request_id,
1377        trace_id,
1378        serde_json::to_value(HitlTimeoutRecord {
1379            request_id: request_id.to_string(),
1380            kind,
1381            trace_id: trace_id.to_string(),
1382            timed_out_at: now_rfc3339(),
1383        })
1384        .map_err(|error| VmError::Runtime(error.to_string()))?,
1385    )
1386    .await
1387}
1388
1389async fn maybe_apply_mock_response(
1390    kind: HitlRequestKind,
1391    request_id: &str,
1392    request_payload: &JsonValue,
1393) -> Result<(), VmError> {
1394    let mut params = request_payload
1395        .as_object()
1396        .cloned()
1397        .unwrap_or_default()
1398        .into_iter()
1399        .map(|(key, value)| (key, crate::stdlib::json_to_vm_value(&value)))
1400        .collect::<crate::value::DictMap>();
1401    params.put_str("request_id", request_id);
1402    let Some(result) = dispatch_mock_host_call("hitl", kind.as_str(), &params) else {
1403        return Ok(());
1404    };
1405    let value = result?;
1406    let responses = match value {
1407        VmValue::List(items) => items.iter().cloned().collect::<Vec<_>>(),
1408        other => vec![other],
1409    };
1410    for response in responses {
1411        let response_dict = response.as_dict().ok_or_else(|| {
1412            VmError::Runtime(format!(
1413                "mocked HITL {} response must be a dict or list<dict>",
1414                kind.as_str()
1415            ))
1416        })?;
1417        let hitl_response = parse_hitl_response_dict(request_id, response_dict)?;
1418        append_hitl_response(None, hitl_response)
1419            .await
1420            .map_err(VmError::Runtime)?;
1421    }
1422    Ok(())
1423}
1424
1425fn parse_hitl_response_dict(
1426    request_id: &str,
1427    response_dict: &crate::value::DictMap,
1428) -> Result<HitlHostResponse, VmError> {
1429    Ok(HitlHostResponse {
1430        request_id: request_id.to_string(),
1431        answer: response_dict
1432            .get("answer")
1433            .map(crate::llm::vm_value_to_json),
1434        approved: response_dict.get("approved").and_then(vm_bool),
1435        accepted: response_dict.get("accepted").and_then(vm_bool),
1436        reviewer: response_dict.get("reviewer").map(VmValue::display),
1437        reason: response_dict.get("reason").map(VmValue::display),
1438        metadata: response_dict
1439            .get("metadata")
1440            .map(crate::llm::vm_value_to_json),
1441        responded_at: response_dict.get("responded_at").map(VmValue::display),
1442        signature: response_dict.get("signature").map(VmValue::display),
1443    })
1444}
1445
1446fn maybe_notify_host(ctx: Option<&AsyncBuiltinCtx>, request: &HitlRequestEnvelope) {
1447    let Some(bridge) = ctx.and_then(|ctx| ctx.child_vm().bridge.clone()) else {
1448        return;
1449    };
1450    bridge.notify(
1451        "harn.hitl.requested",
1452        serde_json::to_value(request).unwrap_or(JsonValue::Null),
1453    );
1454}
1455
1456/// Emit a `HitlRequested` `AgentEvent` so transport adapters
1457/// (currently the A2A `A2aWorkerSink`) can flip a task into
1458/// `input-required` while the script is suspended on the waitpoint.
1459/// No-op when there is no current agent session — the bridge-level
1460/// `harn.hitl.requested` notification still fires for hosts that drive
1461/// HITL UX through the bridge.
1462fn emit_hitl_requested(request: &HitlRequestEnvelope) {
1463    let Some(session_id) = crate::agent_sessions::current_session_id() else {
1464        return;
1465    };
1466    crate::agent_events::emit_event(&crate::agent_events::AgentEvent::HitlRequested {
1467        session_id,
1468        request_id: request.request_id.clone(),
1469        kind: request.kind.as_str().to_string(),
1470        payload: request.payload.clone(),
1471    });
1472}
1473
1474/// Companion to `emit_hitl_requested`: notifies sinks that the
1475/// suspended waitpoint has resolved so a paused task can flip back
1476/// out of `input-required`. `outcome` is one of `"answered"`,
1477/// `"timeout"`, `"cancelled"`, or `"error"`.
1478fn emit_hitl_resolved(request_id: &str, kind: HitlRequestKind, outcome: &str) {
1479    let Some(session_id) = crate::agent_sessions::current_session_id() else {
1480        return;
1481    };
1482    crate::agent_events::emit_event(&crate::agent_events::AgentEvent::HitlResolved {
1483        session_id,
1484        request_id: request_id.to_string(),
1485        kind: kind.as_str().to_string(),
1486        outcome: outcome.to_string(),
1487    });
1488}
1489
1490/// Wrapper around `wait_for_request_waitpoint` that emits the
1491/// canonical `HitlResolved` `AgentEvent` regardless of which terminal
1492/// branch the waitpoint takes (response / timeout / cancellation /
1493/// error). Pair-emitted with `emit_hitl_requested` so transport
1494/// adapters can bracket the `input-required` pause cleanly without
1495/// each `*_impl` having to duplicate the emission at every match arm.
1496async fn wait_for_request_waitpoint_with_events(
1497    request_id: &str,
1498    kind: HitlRequestKind,
1499    timeout: Option<StdDuration>,
1500) -> Result<WaitpointOutcome, VmError> {
1501    let outcome = wait_for_request_waitpoint(request_id, timeout).await;
1502    let label = match &outcome {
1503        Ok(WaitpointOutcome::Completed(_)) => "answered",
1504        Ok(WaitpointOutcome::Timeout) => "timeout",
1505        Ok(WaitpointOutcome::Cancelled { .. }) => "cancelled",
1506        Err(_) => "error",
1507    };
1508    emit_hitl_resolved(request_id, kind, label);
1509    outcome
1510}
1511
1512fn parse_ask_user_options(value: Option<&VmValue>) -> Result<AskUserOptions, VmError> {
1513    let Some(value) = value else {
1514        return Ok(AskUserOptions {
1515            schema: None,
1516            timeout: Some(default_question_timeout()),
1517            default: None,
1518        });
1519    };
1520    let dict = value
1521        .as_dict()
1522        .ok_or_else(|| VmError::Runtime("ask_user: options must be a dict".to_string()))?;
1523    Ok(AskUserOptions {
1524        schema: dict
1525            .get("schema")
1526            .cloned()
1527            .filter(|value| !matches!(value, VmValue::Nil)),
1528        timeout: dict
1529            .get("timeout")
1530            .map(parse_duration_value)
1531            .transpose()?
1532            .or_else(|| Some(default_question_timeout())),
1533        default: dict
1534            .get("default")
1535            .cloned()
1536            .filter(|value| !matches!(value, VmValue::Nil)),
1537    })
1538}
1539
1540fn default_question_timeout() -> StdDuration {
1541    StdDuration::from_millis(HITL_QUESTION_TIMEOUT_MS)
1542}
1543
1544fn escalation_capability_policy() -> JsonValue {
1545    crate::orchestration::current_execution_policy()
1546        .and_then(|policy| serde_json::to_value(policy).ok())
1547        .unwrap_or(JsonValue::Null)
1548}
1549
1550fn parse_approval_options(
1551    value: Option<&VmValue>,
1552    builtin: &str,
1553) -> Result<ApprovalOptions, VmError> {
1554    let dict = match value {
1555        None => None,
1556        Some(VmValue::Dict(dict)) => Some(dict),
1557        Some(_) => {
1558            return Err(VmError::Runtime(format!(
1559                "{builtin}: options must be a dict"
1560            )))
1561        }
1562    };
1563    let quorum = dict
1564        .and_then(|dict| dict.get("quorum"))
1565        .and_then(VmValue::as_int)
1566        .unwrap_or(1);
1567    if quorum <= 0 {
1568        return Err(VmError::Runtime(format!(
1569            "{builtin}: quorum must be positive"
1570        )));
1571    }
1572    let reviewers = optional_string_list(dict.and_then(|dict| dict.get("reviewers")), builtin)?;
1573    let capabilities_requested = optional_string_list(
1574        dict.and_then(|dict| dict.get("capabilities_requested")),
1575        builtin,
1576    )?;
1577    let evidence_refs = dict
1578        .and_then(|dict| dict.get("evidence_refs"))
1579        .map(|value| match value {
1580            VmValue::List(items) => Ok(items
1581                .iter()
1582                .map(crate::llm::vm_value_to_json)
1583                .collect::<Vec<_>>()),
1584            _ => Err(VmError::Runtime(format!(
1585                "{builtin}: evidence_refs must be a list"
1586            ))),
1587        })
1588        .transpose()?
1589        .unwrap_or_default();
1590    let deadline = dict
1591        .and_then(|dict| dict.get("deadline"))
1592        .map(parse_duration_value)
1593        .transpose()?
1594        .unwrap_or_else(|| StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS));
1595    Ok(ApprovalOptions {
1596        detail: dict.and_then(|dict| dict.get("detail")).cloned(),
1597        args: dict.and_then(|dict| dict.get("args")).cloned(),
1598        quorum: quorum as u32,
1599        reviewers,
1600        deadline,
1601        principal: dict
1602            .and_then(|dict| dict.get("principal"))
1603            .map(VmValue::display)
1604            .filter(|value| !value.is_empty()),
1605        evidence_refs,
1606        undo_metadata: dict
1607            .and_then(|dict| dict.get("undo_metadata"))
1608            .map(crate::llm::vm_value_to_json),
1609        capabilities_requested,
1610    })
1611}
1612
1613fn required_string_arg(args: &[VmValue], idx: usize, builtin: &str) -> Result<String, VmError> {
1614    args.get(idx)
1615        .map(VmValue::display)
1616        .filter(|value| !value.is_empty())
1617        .ok_or_else(|| VmError::Runtime(format!("{builtin}: expected string argument at {idx}")))
1618}
1619
1620fn required_positive_int_arg(args: &[VmValue], idx: usize, builtin: &str) -> Result<i64, VmError> {
1621    let value = args
1622        .get(idx)
1623        .and_then(VmValue::as_int)
1624        .ok_or_else(|| VmError::Runtime(format!("{builtin}: expected int argument at {idx}")))?;
1625    if value <= 0 {
1626        return Err(VmError::Runtime(format!(
1627            "{builtin}: expected a positive int at {idx}"
1628        )));
1629    }
1630    Ok(value)
1631}
1632
1633fn optional_string_list(value: Option<&VmValue>, builtin: &str) -> Result<Vec<String>, VmError> {
1634    let Some(value) = value else {
1635        return Ok(Vec::new());
1636    };
1637    match value {
1638        VmValue::List(list) => Ok(list.iter().map(VmValue::display).collect()),
1639        _ => Err(VmError::Runtime(format!(
1640            "{builtin}: expected list<string>"
1641        ))),
1642    }
1643}
1644
1645fn parse_duration_value(value: &VmValue) -> Result<StdDuration, VmError> {
1646    duration_from_value(value, "hitl", "timeout", ErrorKind::Runtime)
1647}
1648
1649fn ensure_hitl_event_log() -> Arc<AnyEventLog> {
1650    active_event_log()
1651        .unwrap_or_else(|| install_memory_for_current_thread(HITL_EVENT_LOG_QUEUE_DEPTH))
1652}
1653
1654fn ensure_hitl_event_log_for(base_dir: Option<&Path>) -> Result<Arc<AnyEventLog>, String> {
1655    if let Some(log) = active_event_log() {
1656        return Ok(log);
1657    }
1658    let Some(base_dir) = base_dir else {
1659        return Ok(install_memory_for_current_thread(
1660            HITL_EVENT_LOG_QUEUE_DEPTH,
1661        ));
1662    };
1663    install_default_for_base_dir(base_dir).map_err(|error| error.to_string())
1664}
1665
1666fn current_dispatch_keys() -> Option<DispatchKeys> {
1667    let context = current_dispatch_context()?;
1668    let stable_base = context
1669        .replay_of_event_id
1670        .clone()
1671        .unwrap_or_else(|| context.trigger_event.id.0.clone());
1672    let instance_key = format!(
1673        "{}::{}",
1674        context.trigger_event.id.0,
1675        context.replay_of_event_id.as_deref().unwrap_or("live")
1676    );
1677    Some(DispatchKeys {
1678        instance_key,
1679        stable_base,
1680        agent: context.agent_id,
1681        trace_id: context.trigger_event.trace_id.0,
1682    })
1683}
1684
1685fn next_request_id(kind: HitlRequestKind, dispatch_keys: Option<&DispatchKeys>) -> String {
1686    if let Some(keys) = dispatch_keys {
1687        let seq = REQUEST_SEQUENCE.with(|slot| {
1688            let mut state = slot.borrow_mut();
1689            if state.instance_key != keys.instance_key {
1690                state.instance_key = keys.instance_key.clone();
1691                state.next_seq = 0;
1692            }
1693            state.next_seq += 1;
1694            state.next_seq
1695        });
1696        return format!("hitl_{}_{}_{}", kind.as_str(), keys.stable_base, seq);
1697    }
1698    format!("hitl_{}_{}", kind.as_str(), Uuid::now_v7())
1699}
1700
1701fn request_headers(request: &HitlRequestEnvelope) -> BTreeMap<String, String> {
1702    let mut headers = headers_with_trace(&request.request_id, &request.trace_id);
1703    if let Some(run_id) = request.run_id.as_ref() {
1704        headers.insert("run_id".to_string(), run_id.clone());
1705    }
1706    headers
1707}
1708
/// Headers attached to a response event: just the `request_id`.
fn response_headers(request_id: &str) -> BTreeMap<String, String> {
    BTreeMap::from([("request_id".to_string(), request_id.to_string())])
}
1714
1715fn headers_with_trace(request_id: &str, trace_id: &str) -> BTreeMap<String, String> {
1716    let mut headers = response_headers(request_id);
1717    headers.insert("trace_id".to_string(), trace_id.to_string());
1718    headers
1719}
1720
1721fn topic(kind: HitlRequestKind) -> Result<Topic, VmError> {
1722    Topic::new(kind.topic()).map_err(|error| VmError::Runtime(error.to_string()))
1723}
1724
1725fn event_matches_request(event: &LogEvent, request_id: &str) -> bool {
1726    event
1727        .headers
1728        .get("request_id")
1729        .is_some_and(|value| value == request_id)
1730        || event
1731            .payload
1732            .get("request_id")
1733            .and_then(JsonValue::as_str)
1734            .is_some_and(|value| value == request_id)
1735}
1736
1737fn approval_denied_error(request_id: &str, response: HitlHostResponse) -> VmError {
1738    VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1739        "name": "ApprovalDeniedError",
1740        "category": "generic",
1741        "message": response.reason.clone().unwrap_or_else(|| "approval was denied".to_string()),
1742        "request_id": request_id,
1743        "reviewers": response.reviewer.into_iter().collect::<Vec<_>>(),
1744        "reason": response.reason,
1745    })))
1746}
1747
1748fn hitl_cancelled_error(
1749    request_id: &str,
1750    kind: HitlRequestKind,
1751    wait_id: &str,
1752    waitpoint_ids: &[String],
1753    reason: Option<String>,
1754) -> VmError {
1755    let _ = categorized_error("HITL cancelled", ErrorCategory::Cancelled);
1756    let message = reason
1757        .clone()
1758        .unwrap_or_else(|| format!("{} cancelled", kind.as_str()));
1759    VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1760        "name": "HumanCancelledError",
1761        "category": ErrorCategory::Cancelled.as_str(),
1762        "message": message,
1763        "request_id": request_id,
1764        "kind": kind.as_str(),
1765        "wait_id": wait_id,
1766        "waitpoint_ids": waitpoint_ids,
1767        "reason": reason,
1768    })))
1769}
1770
1771fn timeout_error(request_id: &str, kind: HitlRequestKind) -> VmError {
1772    let _ = categorized_error("HITL timed out", ErrorCategory::Timeout);
1773    VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1774        "name": "HumanTimeoutError",
1775        "category": ErrorCategory::Timeout.as_str(),
1776        "message": format!("{} timed out", kind.as_str()),
1777        "request_id": request_id,
1778        "kind": kind.as_str(),
1779    })))
1780}
1781
1782fn coerce_like_default(value: &VmValue, default: &VmValue) -> VmValue {
1783    match default {
1784        VmValue::Int(_) => match value {
1785            VmValue::Int(_) => value.clone(),
1786            VmValue::Float(number) => VmValue::Int(*number as i64),
1787            VmValue::String(text) => text
1788                .parse::<i64>()
1789                .map(VmValue::Int)
1790                .unwrap_or_else(|_| default.clone()),
1791            _ => default.clone(),
1792        },
1793        VmValue::Float(_) => match value {
1794            VmValue::Float(_) => value.clone(),
1795            VmValue::Int(number) => VmValue::Float(*number as f64),
1796            VmValue::String(text) => text
1797                .parse::<f64>()
1798                .map(VmValue::Float)
1799                .unwrap_or_else(|_| default.clone()),
1800            _ => default.clone(),
1801        },
1802        VmValue::Bool(_) => match value {
1803            VmValue::Bool(_) => value.clone(),
1804            VmValue::String(text) if text.eq_ignore_ascii_case("true") => VmValue::Bool(true),
1805            VmValue::String(text) if text.eq_ignore_ascii_case("false") => VmValue::Bool(false),
1806            _ => default.clone(),
1807        },
1808        VmValue::String(_) => VmValue::String(std::sync::Arc::from(value.display())),
1809        VmValue::Duration(_) => match value {
1810            VmValue::Duration(_) => value.clone(),
1811            VmValue::Int(ms) => VmValue::Duration(*ms),
1812            _ => default.clone(),
1813        },
1814        VmValue::Nil => value.clone(),
1815        _ => {
1816            if value.type_name() == default.type_name() {
1817                value.clone()
1818            } else {
1819                default.clone()
1820            }
1821        }
1822    }
1823}
1824
1825fn log_error(error: impl std::fmt::Display) -> VmError {
1826    VmError::Runtime(error.to_string())
1827}
1828
1829fn now_rfc3339() -> String {
1830    format_rfc3339(OffsetDateTime::now_utc())
1831}
1832
1833fn format_rfc3339(timestamp: OffsetDateTime) -> String {
1834    timestamp
1835        .format(&Rfc3339)
1836        .unwrap_or_else(|_| timestamp.to_string())
1837}
1838
1839fn deadline_after(requested_at: OffsetDateTime, duration: StdDuration) -> Option<String> {
1840    time::Duration::try_from(duration)
1841        .ok()
1842        .map(|duration| format_rfc3339(requested_at + duration))
1843}
1844
1845fn new_trace_id() -> String {
1846    format!("trace_{}", Uuid::now_v7())
1847}
1848
1849fn vm_bool(value: &VmValue) -> Option<bool> {
1850    match value {
1851        VmValue::Bool(flag) => Some(*flag),
1852        _ => None,
1853    }
1854}
1855
1856fn vm_string(value: &VmValue) -> Option<&str> {
1857    match value {
1858        VmValue::String(text) => Some(text.as_ref()),
1859        _ => None,
1860    }
1861}
1862
1863fn vm_string_list(value: &VmValue) -> Option<Vec<String>> {
1864    match value {
1865        VmValue::List(values) => Some(values.iter().map(VmValue::display).collect()),
1866        _ => None,
1867    }
1868}
1869
1870#[cfg(test)]
1871mod tests {
1872    use std::sync::OnceLock;
1873
1874    use tokio::sync::Mutex;
1875
1876    use super::{
1877        HITL_APPROVALS_TOPIC, HITL_DUAL_CONTROL_TOPIC, HITL_ESCALATIONS_TOPIC, HITL_QUESTIONS_TOPIC,
1878    };
1879    use crate::event_log::{install_default_for_base_dir, EventLog, Topic};
1880    use crate::{compile_source, register_vm_stdlib, reset_thread_local_state, Vm, VmError};
1881
1882    /// Serialize tests that exercise the request-approval path. Those tests
1883    /// drive the Harn VM through its full HITL state machine and rely on
1884    /// thread-local event-log handles that are set up by
1885    /// `execute_hitl_script` → `reset_thread_local_state()`. Under heavy
1886    /// parallel load the OS thread that a `current_thread` tokio runtime
1887    /// runs on can be reused between tests; if the outgoing test's async
1888    /// drop runs concurrently with the incoming test's reset the thread-
1889    /// local event log is in a transitional state and events can be double-
1890    /// counted or missed. Holding this mutex for the duration of each test
1891    /// turns the hazard into a hard serialize.
1892    fn hitl_lock() -> &'static Mutex<()> {
1893        static LOCK: OnceLock<Mutex<()>> = OnceLock::new();
1894        LOCK.get_or_init(|| Mutex::new(()))
1895    }
1896
1897    async fn execute_hitl_script(
1898        base_dir: &std::path::Path,
1899        source: &str,
1900    ) -> Result<(String, Vec<String>, Vec<String>, Vec<String>, Vec<String>), VmError> {
1901        reset_thread_local_state();
1902        let log = install_default_for_base_dir(base_dir).expect("install event log");
1903        let chunk = compile_source(source).expect("compile source");
1904        let mut vm = Vm::new();
1905        register_vm_stdlib(&mut vm);
1906        vm.set_source_dir(base_dir);
1907        vm.execute(&chunk).await?;
1908        let output = vm.output().trim_end().to_string();
1909        let question_events = event_kinds(log.clone(), HITL_QUESTIONS_TOPIC).await;
1910        let approval_events = event_kinds(log.clone(), HITL_APPROVALS_TOPIC).await;
1911        let dual_control_events = event_kinds(log.clone(), HITL_DUAL_CONTROL_TOPIC).await;
1912        let escalation_events = event_kinds(log, HITL_ESCALATIONS_TOPIC).await;
1913        Ok((
1914            output,
1915            question_events,
1916            approval_events,
1917            dual_control_events,
1918            escalation_events,
1919        ))
1920    }
1921
1922    async fn event_kinds(
1923        log: std::sync::Arc<crate::event_log::AnyEventLog>,
1924        topic: &str,
1925    ) -> Vec<String> {
1926        log.read_range(&Topic::new(topic).expect("valid topic"), None, usize::MAX)
1927            .await
1928            .expect("read topic")
1929            .into_iter()
1930            .map(|(_, event)| event.kind)
1931            .collect()
1932    }
1933
1934    async fn event_payloads(
1935        log: std::sync::Arc<crate::event_log::AnyEventLog>,
1936        topic: &str,
1937    ) -> Vec<serde_json::Value> {
1938        log.read_range(&Topic::new(topic).expect("valid topic"), None, usize::MAX)
1939            .await
1940            .expect("read topic")
1941            .into_iter()
1942            .map(|(_, event)| event.payload)
1943            .collect()
1944    }
1945
1946    #[tokio::test(flavor = "current_thread")]
1947    async fn ask_user_coerces_to_default_type_and_logs_events() {
1948        tokio::task::LocalSet::new()
1949            .run_until(async {
1950                let dir = tempfile::tempdir().expect("tempdir");
1951                let source = r#"
1952pipeline test(task) {
1953  host_mock("hitl", "question", {answer: "9"})
1954  let answer: int = ask_user("Pick a number", {default: 0})
1955  __io_println(answer)
1956}
1957"#;
1958                let (
1959                    output,
1960                    question_events,
1961                    approval_events,
1962                    dual_control_events,
1963                    escalation_events,
1964                ) = execute_hitl_script(dir.path(), source)
1965                    .await
1966                    .expect("script succeeds");
1967                assert_eq!(output, "9");
1968                assert_eq!(
1969                    question_events,
1970                    vec![
1971                        "hitl.question_asked".to_string(),
1972                        "hitl.response_received".to_string()
1973                    ]
1974                );
1975                assert!(approval_events.is_empty());
1976                assert!(dual_control_events.is_empty());
1977                assert!(escalation_events.is_empty());
1978            })
1979            .await;
1980    }
1981
1982    #[tokio::test(flavor = "current_thread")]
1983    async fn request_approval_waits_for_quorum_and_emits_a_record() {
1984        let _guard = hitl_lock().lock().await;
1985        tokio::task::LocalSet::new()
1986            .run_until(async {
1987                reset_thread_local_state();
1988                let dir = tempfile::tempdir().expect("tempdir");
1989                let source = r#"
1990pipeline test(task) {
1991  host_mock("hitl", "approval", [
1992    {approved: true, reviewer: "alice", reason: "ok"},
1993    {approved: true, reviewer: "bob", reason: "ship it"},
1994  ])
1995  let record = request_approval(
1996    "deploy production",
1997    {quorum: 2, reviewers: ["alice", "bob", "carol"]},
1998  )
1999  __io_println(record.approved)
2000  __io_println(len(record.reviewers))
2001  __io_println(record.reviewers[0])
2002  __io_println(record.reviewers[1])
2003}
2004"#;
2005                let (_, _, approval_events, _, _) = execute_hitl_script(dir.path(), source)
2006                    .await
2007                    .expect("script succeeds");
2008                assert_eq!(
2009                    approval_events,
2010                    vec![
2011                        "hitl.approval_requested".to_string(),
2012                        "hitl.response_received".to_string(),
2013                        "hitl.response_received".to_string(),
2014                        "hitl.approval_approved".to_string(),
2015                    ]
2016                );
2017            })
2018            .await;
2019    }
2020
2021    #[tokio::test(flavor = "current_thread")]
2022    async fn request_approval_emits_canonical_approval_request_payload() {
2023        tokio::task::LocalSet::new()
2024            .run_until(async {
2025                reset_thread_local_state();
2026                let dir = tempfile::tempdir().expect("tempdir");
2027                let log = install_default_for_base_dir(dir.path()).expect("install event log");
2028                let source = r#"
2029pipeline test(task) {
2030  host_mock("hitl", "approval", {approved: true, reviewer: "alice", reason: "ok"})
2031  request_approval("deploy production", {
2032    args: {environment: "prod"},
2033    quorum: 1,
2034    reviewers: ["alice"],
2035    evidence_refs: [{kind: "run", uri: "run_123"}],
2036    undo_metadata: {strategy: "rollback"},
2037    capabilities_requested: ["deploy.production"],
2038  })
2039}
2040"#;
2041                let chunk = compile_source(source).expect("compile source");
2042                let mut vm = Vm::new();
2043                register_vm_stdlib(&mut vm);
2044                vm.set_source_dir(dir.path());
2045                vm.execute(&chunk).await.expect("script succeeds");
2046
2047                let payloads = event_payloads(log, HITL_APPROVALS_TOPIC).await;
2048                let request_payload = &payloads[0]["payload"];
2049                let approval_request = &request_payload["approval_request"];
2050                assert_eq!(approval_request["id"], request_payload["id"]);
2051                assert_eq!(approval_request["action"], "deploy production");
2052                assert_eq!(approval_request["args"]["environment"], "prod");
2053                assert_eq!(approval_request["approvers_required"], 1);
2054                assert_eq!(approval_request["evidence_refs"][0]["uri"], "run_123");
2055                assert_eq!(approval_request["undo_metadata"]["strategy"], "rollback");
2056                assert_eq!(
2057                    approval_request["capabilities_requested"][0],
2058                    "deploy.production"
2059                );
2060                assert!(approval_request["requested_at"].as_str().is_some());
2061                assert!(approval_request["deadline"].as_str().is_some());
2062            })
2063            .await;
2064    }
2065
2066    #[tokio::test(flavor = "current_thread")]
2067    async fn request_approval_surfaces_denials_as_typed_errors() {
2068        let _guard = hitl_lock().lock().await;
2069        tokio::task::LocalSet::new()
2070            .run_until(async {
2071                reset_thread_local_state();
2072                let dir = tempfile::tempdir().expect("tempdir");
2073                let source = r#"
2074pipeline test(task) {
2075  host_mock("hitl", "approval", {approved: false, reviewer: "alice", reason: "unsafe"})
2076  let denied = try {
2077    request_approval("drop table", {reviewers: ["alice"]})
2078  }
2079  __io_println(is_err(denied))
2080  __io_println(unwrap_err(denied).name)
2081  __io_println(unwrap_err(denied).reason)
2082}
2083"#;
2084                let (output, _, approval_events, _, _) = execute_hitl_script(dir.path(), source)
2085                    .await
2086                    .expect("script succeeds");
2087                assert_eq!(output, "true\nApprovalDeniedError\nunsafe");
2088                assert_eq!(
2089                    approval_events,
2090                    vec![
2091                        "hitl.approval_requested".to_string(),
2092                        "hitl.response_received".to_string(),
2093                        "hitl.approval_denied".to_string(),
2094                    ]
2095                );
2096            })
2097            .await;
2098    }
2099
2100    #[tokio::test(flavor = "current_thread")]
2101    async fn dual_control_executes_action_after_quorum() {
2102        tokio::task::LocalSet::new()
2103            .run_until(async {
2104                let dir = tempfile::tempdir().expect("tempdir");
2105                let source = r#"
2106pipeline test(task) {
2107  host_mock("hitl", "dual_control", [
2108    {approved: true, reviewer: "alice"},
2109    {approved: true, reviewer: "bob"},
2110  ])
2111  let result = dual_control(2, 3, { -> "launched" }, ["alice", "bob", "carol"])
2112  __io_println(result)
2113}
2114"#;
2115                let (output, _, _, dual_control_events, _) =
2116                    execute_hitl_script(dir.path(), source)
2117                        .await
2118                        .expect("script succeeds");
2119                assert_eq!(output, "launched");
2120                assert_eq!(
2121                    dual_control_events,
2122                    vec![
2123                        "hitl.dual_control_requested".to_string(),
2124                        "hitl.response_received".to_string(),
2125                        "hitl.response_received".to_string(),
2126                        "hitl.dual_control_approved".to_string(),
2127                        "hitl.dual_control_executed".to_string(),
2128                    ]
2129                );
2130            })
2131            .await;
2132    }
2133
2134    #[tokio::test(flavor = "current_thread")]
2135    async fn escalate_to_waits_for_acceptance_event() {
2136        tokio::task::LocalSet::new()
2137            .run_until(async {
2138                let dir = tempfile::tempdir().expect("tempdir");
2139                let source = r#"
2140pipeline test(task) {
2141  host_mock("hitl", "escalation", {accepted: true, reviewer: "lead", reason: "taking over"})
2142  let handle = escalate_to("admin", "need override")
2143  __io_println(handle.status)
2144  __io_println(handle.reviewer)
2145}
2146"#;
2147                let (output, _, _, _, escalation_events) = execute_hitl_script(dir.path(), source)
2148                    .await
2149                    .expect("script succeeds");
2150                assert_eq!(output, "accepted\nlead");
2151                assert_eq!(
2152                    escalation_events,
2153                    vec![
2154                        "hitl.escalation_issued".to_string(),
2155                        "hitl.escalation_accepted".to_string(),
2156                    ]
2157                );
2158            })
2159            .await;
2160    }
2161
2162    /// `harn-serve` adapters (A2A `input-required`, ACP `hitl_request`)
2163    /// rely on the canonical `AgentEvent::HitlRequested` /
2164    /// `AgentEvent::HitlResolved` pair to bracket every HITL pause.
2165    /// Pin the contract here so future HITL primitives keep emitting
2166    /// the event around their waitpoint blocks.
2167    #[tokio::test(flavor = "current_thread")]
2168    async fn ask_user_emits_hitl_request_and_resolution_to_agent_event_sinks() {
2169        use std::sync::Mutex as StdMutex;
2170
2171        tokio::task::LocalSet::new()
2172            .run_until(async {
2173                let dir = tempfile::tempdir().expect("tempdir");
2174                let session_id = "hitl-session".to_string();
2175                let captured: std::sync::Arc<StdMutex<Vec<crate::agent_events::AgentEvent>>> =
2176                    std::sync::Arc::new(StdMutex::new(Vec::new()));
2177
2178                struct CaptureSink(std::sync::Arc<StdMutex<Vec<crate::agent_events::AgentEvent>>>);
2179                impl crate::agent_events::AgentEventSink for CaptureSink {
2180                    fn handle_event(&self, event: &crate::agent_events::AgentEvent) {
2181                        self.0.lock().expect("captured").push(event.clone());
2182                    }
2183                }
2184
2185                // Inline the script setup rather than using the
2186                // `execute_hitl_script` helper: that helper calls
2187                // `reset_thread_local_state` (which wipes the session
2188                // store), so any session pushed before it would be
2189                // gone by the time `ask_user` runs.
2190                crate::reset_thread_local_state();
2191                crate::event_log::install_default_for_base_dir(dir.path())
2192                    .expect("install event log");
2193
2194                crate::agent_events::reset_all_sinks();
2195                let sink: std::sync::Arc<dyn crate::agent_events::AgentEventSink> =
2196                    std::sync::Arc::new(CaptureSink(captured.clone()));
2197                crate::agent_events::register_sink(session_id.clone(), sink);
2198                crate::agent_sessions::open_or_create(Some(session_id.clone()));
2199                let _guard = crate::agent_sessions::enter_current_session(session_id.clone());
2200
2201                let source = r#"
2202pipeline test(task) {
2203  host_mock("hitl", "question", {answer: "ok"})
2204  let answer: string = ask_user("Are you sure?", {default: "no"})
2205  __io_println(answer)
2206}
2207"#;
2208                let chunk = crate::compile_source(source).expect("compile source");
2209                let mut vm = Vm::new();
2210                register_vm_stdlib(&mut vm);
2211                vm.set_source_dir(dir.path());
2212                vm.execute(&chunk).await.expect("script runs");
2213                assert_eq!(vm.output().trim_end(), "ok");
2214
2215                let events = captured.lock().expect("captured");
2216                let mut iter = events.iter().filter(|event| {
2217                    matches!(
2218                        event,
2219                        crate::agent_events::AgentEvent::HitlRequested { .. }
2220                            | crate::agent_events::AgentEvent::HitlResolved { .. }
2221                    )
2222                });
2223                let requested = iter.next().expect("HitlRequested emitted");
2224                let resolved = iter.next().expect("HitlResolved emitted");
2225                assert!(iter.next().is_none(), "exactly one pair: {events:?}");
2226
2227                let crate::agent_events::AgentEvent::HitlRequested {
2228                    session_id: req_session,
2229                    request_id: req_id,
2230                    kind: req_kind,
2231                    payload,
2232                } = requested
2233                else {
2234                    panic!("expected HitlRequested, got: {requested:?}");
2235                };
2236                assert_eq!(req_session, &session_id);
2237                assert_eq!(req_kind, "question");
2238                assert!(req_id.starts_with("hitl_question_"));
2239                assert_eq!(payload["prompt"], "Are you sure?");
2240
2241                let crate::agent_events::AgentEvent::HitlResolved {
2242                    request_id: res_id,
2243                    kind: res_kind,
2244                    outcome,
2245                    ..
2246                } = resolved
2247                else {
2248                    panic!("expected HitlResolved, got: {resolved:?}");
2249                };
2250                assert_eq!(res_id, req_id);
2251                assert_eq!(res_kind, "question");
2252                assert_eq!(outcome, "answered");
2253
2254                drop(_guard);
2255                crate::agent_events::reset_all_sinks();
2256            })
2257            .await;
2258    }
2259}