1use crate::value::VmDictExt;
2use std::cell::RefCell;
3use std::collections::{BTreeMap, BTreeSet};
4use std::path::Path;
5use std::sync::Arc;
6use std::time::Duration as StdDuration;
7
8use serde::{Deserialize, Serialize};
9use serde_json::{json, Value as JsonValue};
10use sha2::Digest;
11use time::format_description::well_known::Rfc3339;
12use time::OffsetDateTime;
13use uuid::Uuid;
14
15use crate::event_log::{
16 active_event_log, install_default_for_base_dir, install_memory_for_current_thread, AnyEventLog,
17 EventLog, LogEvent, Topic,
18};
19use crate::runtime_limits::RuntimeLimits;
20use crate::schema::schema_expect_value;
21use crate::stdlib::host::dispatch_mock_host_call;
22use crate::stdlib::macros::{harn_builtin, BuiltinSignature, Param, VmBuiltinDef, TY_ANY, TY_DICT};
23use crate::stdlib::options::{duration_from_value, ErrorKind};
24use crate::stdlib::waitpoint::{
25 cancel_waitpoint_on, complete_waitpoint_on, create_waitpoint_on, inspect_waitpoint_on,
26 wait_on_waitpoints, WaitpointRecord, WaitpointStatus, WaitpointWaitFailure,
27 WaitpointWaitOptions,
28};
29use crate::triggers::dispatcher::current_dispatch_context;
30use crate::value::{categorized_error, ErrorCategory, VmError, VmValue};
31use crate::vm::{AsyncBuiltinCtx, Vm};
32
/// Queue depth for the HITL event log, taken from the default runtime limits.
const HITL_EVENT_LOG_QUEUE_DEPTH: usize = RuntimeLimits::DEFAULT.default_event_log_queue_depth;
/// Deadline applied to approval and dual-control requests: 24 hours, in milliseconds.
const HITL_APPROVAL_TIMEOUT_MS: u64 = 24 * 60 * 60 * 1000;
/// 24 hours, in milliseconds.
/// NOTE(review): presumably the fallback `ask_user` timeout — confirm at the use site.
const HITL_QUESTION_TIMEOUT_MS: u64 = 24 * 60 * 60 * 1000;

/// Event-log topic used for `HitlRequestKind::Question` events.
pub const HITL_QUESTIONS_TOPIC: &str = "hitl.questions";
/// Event-log topic used for `HitlRequestKind::Approval` events.
pub const HITL_APPROVALS_TOPIC: &str = "hitl.approvals";
/// Event-log topic used for `HitlRequestKind::DualControl` events.
pub const HITL_DUAL_CONTROL_TOPIC: &str = "hitl.dual_control";
/// Event-log topic used for `HitlRequestKind::Escalation` events.
pub const HITL_ESCALATIONS_TOPIC: &str = "hitl.escalations";
41
// Per-thread request-sequence state. It is reset, taken and restored through
// `reset_hitl_state`, `take_hitl_state` and `restore_hitl_state`.
thread_local! {
    static REQUEST_SEQUENCE: RefCell<RequestSequenceState> = RefCell::new(RequestSequenceState::default());
}
45
/// Bookkeeping stored in the thread-local `REQUEST_SEQUENCE` slot.
///
/// The default value is an empty key with the counter at zero.
#[derive(Default)]
pub(crate) struct RequestSequenceState {
    /// NOTE(review): presumably identifies the dispatch instance the counter
    /// belongs to — confirm against `next_request_id`.
    pub(crate) instance_key: String,
    /// NOTE(review): presumably the next sequence number to hand out — confirm
    /// against `next_request_id`.
    pub(crate) next_seq: u64,
}
51
/// The kinds of human-in-the-loop request issued by this module.
///
/// Serialized by serde using `snake_case` variant names.
#[derive(Clone, Copy, Debug, PartialEq, Eq, Serialize, Deserialize)]
#[serde(rename_all = "snake_case")]
pub enum HitlRequestKind {
    /// Issued by the `ask_user` builtin.
    Question,
    /// Issued by the `request_approval` builtin and `append_approval_request_on`.
    Approval,
    /// Issued by the `dual_control` builtin.
    DualControl,
    /// Issued by the `escalate_to` builtin.
    Escalation,
}
60
61impl HitlRequestKind {
62 pub(crate) fn as_str(self) -> &'static str {
63 match self {
64 Self::Question => "question",
65 Self::Approval => "approval",
66 Self::DualControl => "dual_control",
67 Self::Escalation => "escalation",
68 }
69 }
70
71 fn topic(self) -> &'static str {
72 match self {
73 Self::Question => HITL_QUESTIONS_TOPIC,
74 Self::Approval => HITL_APPROVALS_TOPIC,
75 Self::DualControl => HITL_DUAL_CONTROL_TOPIC,
76 Self::Escalation => HITL_ESCALATIONS_TOPIC,
77 }
78 }
79
80 fn request_event_kind(self) -> &'static str {
81 match self {
82 Self::Question => "hitl.question_asked",
83 Self::Approval => "hitl.approval_requested",
84 Self::DualControl => "hitl.dual_control_requested",
85 Self::Escalation => "hitl.escalation_issued",
86 }
87 }
88
89 pub(crate) fn from_request_id(request_id: &str) -> Option<Self> {
90 if request_id.starts_with("hitl_question_") {
91 Some(Self::Question)
92 } else if request_id.starts_with("hitl_approval_") {
93 Some(Self::Approval)
94 } else if request_id.starts_with("hitl_dual_control_") {
95 Some(Self::DualControl)
96 } else if request_id.starts_with("hitl_escalation_") {
97 Some(Self::Escalation)
98 } else {
99 None
100 }
101 }
102}
103
/// A host-supplied response to a HITL request, recorded in the event log by
/// `append_hitl_response`.
///
/// Every optional field is left out of the serialized form when it is `None`.
#[derive(Clone, Debug, Serialize, Deserialize)]
pub struct HitlHostResponse {
    /// Id of the request being answered; its prefix determines the request kind.
    pub request_id: String,
    /// Answer value; becomes the waitpoint value when a question is completed.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub answer: Option<JsonValue>,
    /// NOTE(review): presumably the approve/deny verdict for approval and
    /// dual-control requests — the code that reads it is outside this view.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub approved: Option<bool>,
    /// Escalation acceptance flag; an escalation waitpoint is only completed
    /// when this is `Some(true)`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub accepted: Option<bool>,
    /// Identity of the responding reviewer, if known.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub reviewer: Option<String>,
    /// Free-form reason accompanying the response.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub reason: Option<String>,
    /// Extra metadata forwarded when the waitpoint is completed or cancelled.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub metadata: Option<JsonValue>,
    /// Response timestamp; `append_hitl_response` fills it in when absent.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub responded_at: Option<String>,
    /// NOTE(review): presumably a reviewer signature — its consumer is not
    /// visible here.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub signature: Option<String>,
}
124
/// Envelope describing a single HITL request.
///
/// Built by the request functions in this module and deserialized back from
/// request events by `load_request_envelope`.
#[derive(Clone, Debug, Serialize, Deserialize)]
struct HitlRequestEnvelope {
    /// Unique id of the request; also used as the waitpoint id.
    request_id: String,
    /// Which kind of HITL request this is.
    kind: HitlRequestKind,
    /// Requesting agent; an empty string when missing on deserialization.
    #[serde(default)]
    agent: String,
    /// Trace id associated with the request.
    trace_id: String,
    /// Run id of the current mutation session, if any; omitted when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    run_id: Option<String>,
    /// Timestamp string recorded when the request was created.
    requested_at: String,
    /// Kind-specific request body.
    payload: JsonValue,
}
137
/// Serializable record of a HITL request that timed out.
///
/// NOTE(review): presumably the payload written by `append_timeout_once` — the
/// producer is outside this view.
#[derive(Clone, Debug, Serialize, Deserialize)]
struct HitlTimeoutRecord {
    /// Id of the request that timed out.
    request_id: String,
    /// Kind of the request that timed out.
    kind: HitlRequestKind,
    /// Trace id associated with the request.
    trace_id: String,
    /// Timestamp string of the timeout.
    timed_out_at: String,
}
145
/// Structured description of an action awaiting approval.
///
/// Embedded under the `approval_request` key of approval and dual-control
/// request payloads.
#[derive(Clone, Debug, Serialize, Deserialize, PartialEq, Eq)]
pub struct ApprovalRequest {
    /// Request id.
    pub id: String,
    /// Name of the action being approved.
    pub action: String,
    /// Arguments of the action; `null` when missing on deserialization.
    #[serde(default)]
    pub args: JsonValue,
    /// Principal on whose behalf the action is requested.
    pub principal: String,
    /// Timestamp string of when the request was made.
    pub requested_at: String,
    /// Optional deadline; omitted from the serialized form when `None`.
    #[serde(skip_serializing_if = "Option::is_none")]
    pub deadline: Option<String>,
    /// Number of approvers required; `ApprovalRequest::new` sets it to 1.
    pub approvers_required: u32,
    /// Evidence references attached to the request.
    #[serde(default)]
    pub evidence_refs: Vec<JsonValue>,
    /// Undo metadata; `null` when none is provided.
    #[serde(default)]
    pub undo_metadata: JsonValue,
    /// Capabilities requested alongside the action.
    #[serde(default)]
    pub capabilities_requested: Vec<String>,
}
164
165impl ApprovalRequest {
166 pub fn new(
167 id: impl Into<String>,
168 action: impl Into<String>,
169 args: JsonValue,
170 principal: impl Into<String>,
171 requested_at: impl Into<String>,
172 ) -> Self {
173 Self {
174 id: id.into(),
175 action: action.into(),
176 args,
177 principal: principal.into(),
178 requested_at: requested_at.into(),
179 deadline: None,
180 approvers_required: 1,
181 evidence_refs: Vec::new(),
182 undo_metadata: JsonValue::Null,
183 capabilities_requested: Vec::new(),
184 }
185 }
186}
187
188pub(crate) fn approval_request_for_host_permission(
189 id: impl Into<String>,
190 action: impl Into<String>,
191 args: JsonValue,
192 principal: impl Into<String>,
193 evidence_refs: Vec<JsonValue>,
194 undo_metadata: JsonValue,
195 capabilities_requested: Vec<String>,
196) -> ApprovalRequest {
197 let mut request = ApprovalRequest::new(id, action, args, principal, now_rfc3339());
198 request.evidence_refs = evidence_refs;
199 request.undo_metadata = undo_metadata;
200 request.capabilities_requested = capabilities_requested;
201 request
202}
203
/// Identity of the current dispatch, as returned by `current_dispatch_keys`.
#[derive(Clone, Debug)]
struct DispatchKeys {
    /// NOTE(review): presumably keys the per-instance request sequence —
    /// confirm against `next_request_id`.
    instance_key: String,
    /// NOTE(review): presumably the stable prefix for generated request ids —
    /// confirm against `next_request_id`.
    stable_base: String,
    /// Agent name copied into request envelopes.
    agent: String,
    /// Trace id copied into request envelopes.
    trace_id: String,
}
211
/// Parsed options of the `ask_user` builtin.
#[derive(Clone, Debug)]
struct AskUserOptions {
    /// Schema the answer is validated against, when provided.
    schema: Option<VmValue>,
    /// How long to wait for an answer.
    timeout: Option<StdDuration>,
    /// Value returned on timeout; also guides answer coercion when no schema
    /// is given.
    default: Option<VmValue>,
}
218
/// Parsed options of the `request_approval` builtin.
#[derive(Clone, Debug)]
struct ApprovalOptions {
    /// Free-form detail published in the request payload; also used as the
    /// approval arguments when `args` is absent.
    detail: Option<VmValue>,
    /// Arguments of the action being approved.
    args: Option<VmValue>,
    /// Number of approvals required.
    quorum: u32,
    /// Reviewers published in the request payload.
    reviewers: Vec<String>,
    /// How long to wait for the approval.
    deadline: StdDuration,
    /// Principal override; the agent name is used when absent.
    principal: Option<String>,
    /// Evidence references copied into the approval request.
    evidence_refs: Vec<JsonValue>,
    /// Undo metadata override; the serialized mutation session is used when
    /// absent.
    undo_metadata: Option<JsonValue>,
    /// Capabilities copied into the approval request.
    capabilities_requested: Vec<String>,
}
231
/// Approval state accumulated by `resolve_approval_state` for one request.
#[derive(Clone, Debug)]
struct ApprovalProgress {
    /// Id of the request being resolved.
    request_id: String,
    /// Distinct reviewers collected so far.
    reviewers: BTreeSet<String>,
    /// Signatures collected so far.
    signatures: Vec<ApprovalSignature>,
    /// Reason forwarded when the waitpoint is completed.
    reason: Option<String>,
    /// NOTE(review): presumably the timestamp at which quorum was reached —
    /// the code that sets it is outside this view.
    approved_at: Option<String>,
}
240
/// One serializable reviewer signature recorded in an `ApprovalProgress`.
#[derive(Clone, Debug, Serialize)]
struct ApprovalSignature {
    /// Reviewer the signature belongs to.
    reviewer: String,
    /// Timestamp string of the signature.
    signed_at: String,
    /// Signature value.
    signature: String,
}
247
/// Result of `resolve_approval_state` for an approval or dual-control request.
#[derive(Clone, Debug)]
enum ApprovalResolution {
    /// No decision yet; `finalize_hitl_response` leaves the waitpoint untouched.
    Pending,
    /// Approved; carries the accumulated progress used to build the record.
    Approved(ApprovalProgress),
    /// Denied; carries the denying response.
    Denied(HitlHostResponse),
}
254
/// Outcome of waiting on a single request waitpoint.
// `Completed` holds a full `WaitpointRecord` inline while the other variants
// are small, which is what the `large_enum_variant` lint flags.
#[allow(clippy::large_enum_variant)]
#[derive(Clone, Debug)]
enum WaitpointOutcome {
    /// The waitpoint completed; carries its record.
    Completed(WaitpointRecord),
    /// The wait timed out.
    Timeout,
    /// The wait was cancelled.
    Cancelled {
        /// Id of the cancelled wait.
        wait_id: String,
        /// Ids of the waitpoints that were being waited on.
        waitpoint_ids: Vec<String>,
        /// Cancellation reason, if any.
        reason: Option<String>,
    },
}
273
274pub(crate) fn register_hitl_builtins(vm: &mut Vm) {
275 for def in MODULE_BUILTINS {
276 vm.register_builtin_def(def);
277 }
278}
279
/// Builtin definitions installed by `register_hitl_builtins`.
///
/// NOTE(review): the `*_BUILTIN_DEF` items are presumably generated by the
/// `#[harn_builtin]` attribute on the corresponding async functions — confirm.
pub(crate) const MODULE_BUILTINS: &[&VmBuiltinDef] = &[
    &ASK_USER_BUILTIN_DEF,
    &REQUEST_APPROVAL_BUILTIN_DEF,
    &DUAL_CONTROL_BUILTIN_DEF,
    &ESCALATE_TO_BUILTIN_DEF,
];
286
// `ask_user(prompt, options?)` builtin entry point; forwards the async
// context and arguments to `ask_user_impl`.
#[harn_builtin(
    sig = "ask_user(prompt: string, options?: dict) -> any",
    kind = "async",
    category = "hitl"
)]
async fn ask_user_builtin(
    ctx: crate::vm::AsyncBuiltinCtx,
    args: Vec<VmValue>,
) -> Result<VmValue, VmError> {
    ask_user_impl(Some(&ctx), &args).await
}
298
// `request_approval(...)` builtin entry point (variadic signature); forwards
// the async context and arguments to `request_approval_impl`.
#[harn_builtin(
    sig_expr = BuiltinSignature::variadic("request_approval", &[Param::new("args", TY_ANY)], TY_DICT),
    kind = "async",
    category = "hitl"
)]
async fn request_approval_builtin(
    ctx: crate::vm::AsyncBuiltinCtx,
    args: Vec<VmValue>,
) -> Result<VmValue, VmError> {
    request_approval_impl(Some(&ctx), &args).await
}
310
// `dual_control(n, m, action, approvers?)` builtin entry point; forwards the
// async context and arguments to `dual_control_impl`.
#[harn_builtin(
    sig = "dual_control(n: int, m: int, action: closure, approvers?: list) -> dict",
    kind = "async",
    category = "hitl"
)]
async fn dual_control_builtin(
    ctx: crate::vm::AsyncBuiltinCtx,
    args: Vec<VmValue>,
) -> Result<VmValue, VmError> {
    dual_control_impl(&ctx, &args).await
}
322
// `escalate_to(role, reason)` builtin entry point; forwards the async context
// and arguments to `escalate_to_impl`.
#[harn_builtin(
    sig = "escalate_to(role: string, reason: string) -> dict",
    kind = "async",
    category = "hitl"
)]
async fn escalate_to_builtin(
    ctx: crate::vm::AsyncBuiltinCtx,
    args: Vec<VmValue>,
) -> Result<VmValue, VmError> {
    escalate_to_impl(Some(&ctx), &args).await
}
334
335pub(crate) fn reset_hitl_state() {
336 REQUEST_SEQUENCE.with(|slot| {
337 *slot.borrow_mut() = RequestSequenceState::default();
338 });
339}
340
341pub(crate) fn take_hitl_state() -> RequestSequenceState {
342 REQUEST_SEQUENCE.with(|slot| std::mem::take(&mut *slot.borrow_mut()))
343}
344
345pub(crate) fn restore_hitl_state(state: RequestSequenceState) {
346 REQUEST_SEQUENCE.with(|slot| {
347 *slot.borrow_mut() = state;
348 });
349}
350
351pub async fn append_hitl_response(
352 base_dir: Option<&Path>,
353 mut response: HitlHostResponse,
354) -> Result<u64, String> {
355 let kind = HitlRequestKind::from_request_id(&response.request_id)
356 .ok_or_else(|| format!("unknown HITL request id '{}'", response.request_id))?;
357 if response.responded_at.is_none() {
358 response.responded_at = Some(now_rfc3339());
359 }
360 let log = ensure_hitl_event_log_for(base_dir)?;
361 let headers = response_headers(&response.request_id);
362 let topic = Topic::new(kind.topic()).map_err(|error| error.to_string())?;
363 let event_id = log
364 .append(
365 &topic,
366 LogEvent::new(
367 match kind {
368 HitlRequestKind::Escalation => "hitl.escalation_accepted",
369 _ => "hitl.response_received",
370 },
371 serde_json::to_value(&response).map_err(|error| error.to_string())?,
372 )
373 .with_headers(headers),
374 )
375 .await
376 .map_err(|error| error.to_string())?;
377 finalize_hitl_response(&log, kind, &response).await?;
378 Ok(event_id)
379}
380
/// Publishes an approval request on `log` without waiting for the decision.
///
/// The request uses a quorum of one approver and a deadline of
/// `HITL_APPROVAL_TIMEOUT_MS`, with `agent` as the principal and `detail` as
/// the arguments. A waitpoint is created, the request event is appended and
/// the host is notified (without a builtin context).
///
/// Returns the generated request id.
///
/// # Errors
///
/// Fails when the approval request cannot be serialized, or when creating the
/// waitpoint or appending the request fails.
pub async fn append_approval_request_on(
    log: &Arc<AnyEventLog>,
    agent: impl Into<String>,
    trace_id: impl Into<String>,
    action: impl Into<String>,
    detail: JsonValue,
    reviewers: Vec<String>,
) -> Result<String, VmError> {
    let request_id = next_request_id(HitlRequestKind::Approval, current_dispatch_keys().as_ref());
    let trace_id = trace_id.into();
    let agent = agent.into();
    // Capture the time once so `requested_at` and `deadline` share one base.
    let requested_at_time = OffsetDateTime::now_utc();
    let requested_at = format_rfc3339(requested_at_time);
    let mut approval_request = ApprovalRequest::new(
        request_id.clone(),
        action.into(),
        detail.clone(),
        agent.clone(),
        requested_at.clone(),
    );
    approval_request.deadline = deadline_after(
        requested_at_time,
        StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS),
    );
    approval_request.approvers_required = 1;
    let approval_request_json = serde_json::to_value(&approval_request)
        .map_err(|error| VmError::Runtime(error.to_string()))?;
    let request = HitlRequestEnvelope {
        request_id: request_id.clone(),
        kind: HitlRequestKind::Approval,
        agent,
        trace_id: trace_id.clone(),
        run_id: None,
        requested_at: requested_at.clone(),
        // The payload carries the structured request under `approval_request`
        // and repeats its fields, plus `detail`/`quorum`/`reviewers`/
        // `deadline_ms`, at the top level.
        payload: json!({
            "approval_request": approval_request_json,
            "id": approval_request.id,
            "action": approval_request.action,
            "args": approval_request.args,
            "principal": approval_request.principal,
            "requested_at": requested_at,
            "deadline": approval_request.deadline,
            "approvers_required": approval_request.approvers_required,
            "evidence_refs": approval_request.evidence_refs,
            "undo_metadata": approval_request.undo_metadata,
            "capabilities_requested": approval_request.capabilities_requested,
            "detail": detail,
            "quorum": 1,
            "reviewers": reviewers,
            "deadline_ms": HITL_APPROVAL_TIMEOUT_MS,
        }),
    };
    // The waitpoint is created before the request event is appended.
    create_request_waitpoint(log, &request).await?;
    append_request(log, &request).await?;
    maybe_notify_host(None, &request);
    Ok(request_id)
}
438
439async fn ask_user_impl(
440 ctx: Option<&AsyncBuiltinCtx>,
441 args: &[VmValue],
442) -> Result<VmValue, VmError> {
443 let prompt = required_string_arg(args, 0, "ask_user")?;
444 let options = parse_ask_user_options(args.get(1))?;
445 let keys = current_dispatch_keys();
446 let request_id = next_request_id(HitlRequestKind::Question, keys.as_ref());
447 let trace_id = keys
448 .as_ref()
449 .map(|keys| keys.trace_id.clone())
450 .unwrap_or_else(new_trace_id);
451 let log = ensure_hitl_event_log();
452 let request = HitlRequestEnvelope {
453 request_id: request_id.clone(),
454 kind: HitlRequestKind::Question,
455 agent: keys
456 .as_ref()
457 .map(|keys| keys.agent.clone())
458 .unwrap_or_default(),
459 trace_id: trace_id.clone(),
460 run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
461 requested_at: now_rfc3339(),
462 payload: json!({
463 "prompt": prompt,
464 "schema": options.schema.as_ref().map(crate::llm::vm_value_to_json),
465 "default": options.default.as_ref().map(crate::llm::vm_value_to_json),
466 "timeout_ms": options.timeout.map(|timeout| timeout.as_millis() as u64),
467 }),
468 };
469 create_request_waitpoint(&log, &request).await?;
470 append_request(&log, &request).await?;
471 maybe_notify_host(ctx, &request);
472 emit_hitl_requested(&request);
473 maybe_apply_mock_response(HitlRequestKind::Question, &request_id, &request.payload).await?;
474
475 match wait_for_request_waitpoint_with_events(
476 &request_id,
477 HitlRequestKind::Question,
478 options.timeout,
479 )
480 .await?
481 {
482 WaitpointOutcome::Completed(record) => {
483 let answer = record
484 .value
485 .as_ref()
486 .map(crate::stdlib::json_to_vm_value)
487 .unwrap_or(VmValue::Nil);
488 if let Some(schema) = options.schema.as_ref() {
489 return schema_expect_value(&answer, schema, true);
490 }
491 if let Some(default) = options.default.as_ref() {
492 return Ok(coerce_like_default(&answer, default));
493 }
494 Ok(answer)
495 }
496 WaitpointOutcome::Timeout => {
497 append_timeout_once(&log, HitlRequestKind::Question, &request_id, &trace_id).await?;
498 if let Some(default) = options.default {
499 return Ok(default);
500 }
501 Err(timeout_error(&request_id, HitlRequestKind::Question))
502 }
503 WaitpointOutcome::Cancelled {
504 wait_id,
505 waitpoint_ids,
506 reason,
507 } => Err(hitl_cancelled_error(
508 &request_id,
509 HitlRequestKind::Question,
510 &wait_id,
511 &waitpoint_ids,
512 reason,
513 )),
514 }
515}
516
/// Implements `request_approval(action, options?)`.
///
/// Builds an `ApprovalRequest` from the parsed options, publishes it
/// (waitpoint, log event, host notification, optional mock response) and waits
/// up to `options.deadline` for the waitpoint to resolve.
///
/// Returns the approval record built by `approval_record_from_waitpoint` on
/// completion. A timeout records a timeout event and returns a timeout error;
/// a cancelled wait returns the error built by `approval_wait_error`.
async fn request_approval_impl(
    ctx: Option<&AsyncBuiltinCtx>,
    args: &[VmValue],
) -> Result<VmValue, VmError> {
    let action = required_string_arg(args, 0, "request_approval")?;
    let options = parse_approval_options(args.get(1), "request_approval")?;
    let keys = current_dispatch_keys();
    let request_id = next_request_id(HitlRequestKind::Approval, keys.as_ref());
    // Outside a dispatch there are no keys: use a fresh trace id and an empty
    // agent name.
    let trace_id = keys
        .as_ref()
        .map(|keys| keys.trace_id.clone())
        .unwrap_or_else(new_trace_id);
    let agent = keys
        .as_ref()
        .map(|keys| keys.agent.clone())
        .unwrap_or_default();
    // Capture the time once so `requested_at` and `deadline` share one base.
    let requested_at_time = OffsetDateTime::now_utc();
    let requested_at = format_rfc3339(requested_at_time);
    // The principal defaults to the requesting agent.
    let principal = options.principal.clone().unwrap_or_else(|| agent.clone());
    // Approval arguments: explicit `args`, else `detail`, else `null`.
    let approval_args = options
        .args
        .as_ref()
        .or(options.detail.as_ref())
        .map(crate::llm::vm_value_to_json)
        .unwrap_or(JsonValue::Null);
    let mut approval_request = ApprovalRequest::new(
        request_id.clone(),
        action.clone(),
        approval_args,
        principal,
        requested_at.clone(),
    );
    approval_request.deadline = deadline_after(requested_at_time, options.deadline);
    approval_request.approvers_required = options.quorum;
    approval_request.evidence_refs = options.evidence_refs.clone();
    // Undo metadata: explicit option, else the serialized mutation session,
    // else `null`.
    approval_request.undo_metadata = options
        .undo_metadata
        .clone()
        .or_else(|| {
            crate::orchestration::current_mutation_session()
                .and_then(|session| serde_json::to_value(session).ok())
        })
        .unwrap_or(JsonValue::Null);
    approval_request.capabilities_requested = options.capabilities_requested.clone();
    let approval_request_json = serde_json::to_value(&approval_request)
        .map_err(|error| VmError::Runtime(error.to_string()))?;
    let log = ensure_hitl_event_log();
    let request = HitlRequestEnvelope {
        request_id: request_id.clone(),
        kind: HitlRequestKind::Approval,
        agent,
        trace_id: trace_id.clone(),
        run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
        requested_at: requested_at.clone(),
        // The payload carries the structured request under `approval_request`
        // and repeats its fields, plus `detail`/`quorum`/`reviewers`/
        // `deadline_ms`, at the top level.
        payload: json!({
            "approval_request": approval_request_json,
            "id": approval_request.id,
            "action": action,
            "args": approval_request.args,
            "principal": approval_request.principal,
            "requested_at": requested_at,
            "deadline": approval_request.deadline,
            "approvers_required": approval_request.approvers_required,
            "evidence_refs": approval_request.evidence_refs,
            "undo_metadata": approval_request.undo_metadata,
            "capabilities_requested": approval_request.capabilities_requested,
            "detail": options.detail.as_ref().map(crate::llm::vm_value_to_json),
            "quorum": options.quorum,
            "reviewers": options.reviewers,
            "deadline_ms": options.deadline.as_millis() as u64,
        }),
    };
    // Publish: waitpoint first, then the log event, then notifications.
    create_request_waitpoint(&log, &request).await?;
    append_request(&log, &request).await?;
    maybe_notify_host(ctx, &request);
    emit_hitl_requested(&request);
    maybe_apply_mock_response(HitlRequestKind::Approval, &request_id, &request.payload).await?;

    match wait_for_request_waitpoint_with_events(
        &request_id,
        HitlRequestKind::Approval,
        Some(options.deadline),
    )
    .await?
    {
        WaitpointOutcome::Completed(record) => {
            approval_record_from_waitpoint(&record, "request_approval")
        }
        WaitpointOutcome::Timeout => {
            append_timeout_once(&log, HitlRequestKind::Approval, &request_id, &trace_id).await?;
            Err(timeout_error(&request_id, HitlRequestKind::Approval))
        }
        // `finalize_hitl_response` cancels the waitpoint when an approval is
        // denied, so a cancelled wait is reported through `approval_wait_error`.
        WaitpointOutcome::Cancelled { .. } => {
            Err(approval_wait_error(&log, HitlRequestKind::Approval, &request_id).await)
        }
    }
}
614
615pub(crate) async fn request_approval_for_side_effect(
616 action: &str,
617 detail: JsonValue,
618 principal: String,
619 reviewers: Vec<String>,
620 capabilities_requested: Vec<String>,
621) -> Result<VmValue, VmError> {
622 let mut options = crate::value::DictMap::new();
623 options.insert("args".to_string(), crate::stdlib::json_to_vm_value(&detail));
624 options.insert(
625 "detail".to_string(),
626 crate::stdlib::json_to_vm_value(&detail),
627 );
628 options.put_str("principal", principal);
629 options.insert(
630 "reviewers".to_string(),
631 VmValue::List(std::sync::Arc::new(
632 reviewers
633 .into_iter()
634 .map(|reviewer| VmValue::String(std::sync::Arc::from(reviewer)))
635 .collect(),
636 )),
637 );
638 options.insert(
639 "capabilities_requested".to_string(),
640 VmValue::List(std::sync::Arc::new(
641 capabilities_requested
642 .into_iter()
643 .map(|capability| VmValue::String(std::sync::Arc::from(capability)))
644 .collect(),
645 )),
646 );
647 let args = vec![
648 VmValue::String(std::sync::Arc::from(action.to_string())),
649 VmValue::dict(options),
650 ];
651 request_approval_impl(None, &args).await
652}
653
654async fn dual_control_impl(ctx: &AsyncBuiltinCtx, args: &[VmValue]) -> Result<VmValue, VmError> {
655 let n = required_positive_int_arg(args, 0, "dual_control")?;
656 let m = required_positive_int_arg(args, 1, "dual_control")?;
657 if n > m {
658 return Err(VmError::Runtime(
659 "dual_control: n must be less than or equal to m".to_string(),
660 ));
661 }
662 let action = args
663 .get(2)
664 .and_then(|value| match value {
665 VmValue::Closure(closure) => Some(closure.clone()),
666 _ => None,
667 })
668 .ok_or_else(|| VmError::Runtime("dual_control: action must be a closure".to_string()))?;
669 let approvers = optional_string_list(args.get(3), "dual_control")?;
670 if !approvers.is_empty() && approvers.len() < m as usize {
671 return Err(VmError::Runtime(format!(
672 "dual_control: expected at least {m} approvers, got {}",
673 approvers.len()
674 )));
675 }
676
677 let keys = current_dispatch_keys();
678 let request_id = next_request_id(HitlRequestKind::DualControl, keys.as_ref());
679 let trace_id = keys
680 .as_ref()
681 .map(|keys| keys.trace_id.clone())
682 .unwrap_or_else(new_trace_id);
683 let action_name = if action.func.name.is_empty() {
684 "anonymous".to_string()
685 } else {
686 action.func.name.clone()
687 };
688 let agent = keys
689 .as_ref()
690 .map(|keys| keys.agent.clone())
691 .unwrap_or_default();
692 let requested_at_time = OffsetDateTime::now_utc();
693 let requested_at = format_rfc3339(requested_at_time);
694 let mut approval_request = ApprovalRequest::new(
695 request_id.clone(),
696 action_name.clone(),
697 json!({
698 "n": n,
699 "m": m,
700 "approvers": approvers.clone(),
701 }),
702 agent.clone(),
703 requested_at.clone(),
704 );
705 approval_request.deadline = deadline_after(
706 requested_at_time,
707 StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS),
708 );
709 approval_request.approvers_required = n as u32;
710 approval_request.undo_metadata = crate::orchestration::current_mutation_session()
711 .and_then(|session| serde_json::to_value(session).ok())
712 .unwrap_or(JsonValue::Null);
713 let approval_request_json = serde_json::to_value(&approval_request)
714 .map_err(|error| VmError::Runtime(error.to_string()))?;
715 let log = ensure_hitl_event_log();
716 let request = HitlRequestEnvelope {
717 request_id: request_id.clone(),
718 kind: HitlRequestKind::DualControl,
719 agent,
720 trace_id: trace_id.clone(),
721 run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
722 requested_at: requested_at.clone(),
723 payload: json!({
724 "approval_request": approval_request_json,
725 "id": approval_request.id,
726 "args": approval_request.args,
727 "principal": approval_request.principal,
728 "requested_at": requested_at,
729 "deadline": approval_request.deadline,
730 "approvers_required": approval_request.approvers_required,
731 "evidence_refs": approval_request.evidence_refs,
732 "undo_metadata": approval_request.undo_metadata,
733 "capabilities_requested": approval_request.capabilities_requested,
734 "n": n,
735 "m": m,
736 "action": action_name,
737 "approvers": approvers,
738 "deadline_ms": HITL_APPROVAL_TIMEOUT_MS,
739 }),
740 };
741 create_request_waitpoint(&log, &request).await?;
742 append_request(&log, &request).await?;
743 maybe_notify_host(Some(ctx), &request);
744 emit_hitl_requested(&request);
745 maybe_apply_mock_response(HitlRequestKind::DualControl, &request_id, &request.payload).await?;
746
747 match wait_for_request_waitpoint_with_events(
748 &request_id,
749 HitlRequestKind::DualControl,
750 Some(StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS)),
751 )
752 .await?
753 {
754 WaitpointOutcome::Completed(record) => {
755 let _ = approval_record_from_waitpoint(&record, "dual_control")?;
756 let mut vm = ctx.child_vm();
757 let result = vm.call_closure_pub(&action, &[]).await?;
758 ctx.forward_output(&vm.take_output());
759
760 append_named_event(
761 &log,
762 HitlRequestKind::DualControl,
763 "hitl.dual_control_executed",
764 &request_id,
765 &trace_id,
766 json!({
767 "request_id": request_id,
768 "result": crate::llm::vm_value_to_json(&result),
769 }),
770 )
771 .await?;
772
773 Ok(result)
774 }
775 WaitpointOutcome::Timeout => {
776 append_timeout_once(&log, HitlRequestKind::DualControl, &request_id, &trace_id).await?;
777 Err(timeout_error(&request_id, HitlRequestKind::DualControl))
778 }
779 WaitpointOutcome::Cancelled { .. } => {
780 Err(approval_wait_error(&log, HitlRequestKind::DualControl, &request_id).await)
781 }
782 }
783}
784
785async fn escalate_to_impl(
786 ctx: Option<&AsyncBuiltinCtx>,
787 args: &[VmValue],
788) -> Result<VmValue, VmError> {
789 let role = required_string_arg(args, 0, "escalate_to")?;
790 let reason = required_string_arg(args, 1, "escalate_to")?;
791 let keys = current_dispatch_keys();
792 let request_id = next_request_id(HitlRequestKind::Escalation, keys.as_ref());
793 let trace_id = keys
794 .as_ref()
795 .map(|keys| keys.trace_id.clone())
796 .unwrap_or_else(new_trace_id);
797 let log = ensure_hitl_event_log();
798 let request = HitlRequestEnvelope {
799 request_id: request_id.clone(),
800 kind: HitlRequestKind::Escalation,
801 agent: keys
802 .as_ref()
803 .map(|keys| keys.agent.clone())
804 .unwrap_or_default(),
805 trace_id: trace_id.clone(),
806 run_id: crate::orchestration::current_mutation_session().and_then(|session| session.run_id),
807 requested_at: now_rfc3339(),
808 payload: json!({
809 "role": role,
810 "reason": reason,
811 "capability_policy": escalation_capability_policy(),
812 }),
813 };
814 create_request_waitpoint(&log, &request).await?;
815 append_request(&log, &request).await?;
816 maybe_notify_host(ctx, &request);
817 emit_hitl_requested(&request);
818 maybe_apply_mock_response(HitlRequestKind::Escalation, &request_id, &request.payload).await?;
819
820 match wait_for_request_waitpoint_with_events(&request_id, HitlRequestKind::Escalation, None)
821 .await?
822 {
823 WaitpointOutcome::Completed(record) => {
824 let accepted_at = record.completed_at.clone();
825 let reviewer = record.completed_by.clone();
826 let accepted = record
827 .value
828 .as_ref()
829 .and_then(|value| value.get("accepted"))
830 .and_then(JsonValue::as_bool)
831 .unwrap_or(true);
832 Ok(crate::stdlib::json_to_vm_value(&json!({
833 "request_id": request_id,
834 "role": role,
835 "reason": reason,
836 "trace_id": trace_id,
837 "status": if accepted { "accepted" } else { "pending" },
838 "accepted_at": accepted_at,
839 "reviewer": reviewer,
840 })))
841 }
842 WaitpointOutcome::Timeout => Err(timeout_error(&request_id, HitlRequestKind::Escalation)),
843 WaitpointOutcome::Cancelled {
844 wait_id,
845 waitpoint_ids,
846 reason,
847 } => Err(hitl_cancelled_error(
848 &request_id,
849 HitlRequestKind::Escalation,
850 &wait_id,
851 &waitpoint_ids,
852 reason,
853 )),
854 }
855}
856
857async fn create_request_waitpoint(
858 log: &Arc<AnyEventLog>,
859 request: &HitlRequestEnvelope,
860) -> Result<(), VmError> {
861 create_waitpoint_on(
862 log,
863 Some(request.request_id.clone()),
864 Some(json!({
865 "kind": request.kind.as_str(),
866 "agent": request.agent.clone(),
867 "trace_id": request.trace_id.clone(),
868 "requested_at": request.requested_at.clone(),
869 "payload": request.payload.clone(),
870 })),
871 )
872 .await?;
873 Ok(())
874}
875
876async fn wait_for_request_waitpoint(
877 request_id: &str,
878 timeout: Option<StdDuration>,
879) -> Result<WaitpointOutcome, VmError> {
880 match wait_on_waitpoints(
881 vec![request_id.to_string()],
882 WaitpointWaitOptions { timeout },
883 )
884 .await
885 {
886 Ok(records) => Ok(WaitpointOutcome::Completed(
887 records
888 .into_iter()
889 .next()
890 .expect("single waitpoint wait result"),
891 )),
892 Err(WaitpointWaitFailure::Timeout { .. }) => Ok(WaitpointOutcome::Timeout),
893 Err(WaitpointWaitFailure::Cancelled {
894 wait_id,
895 waitpoint_ids,
896 reason,
897 }) => Ok(WaitpointOutcome::Cancelled {
898 wait_id,
899 waitpoint_ids,
900 reason,
901 }),
902 Err(WaitpointWaitFailure::Vm(error)) => {
903 if let Some(outcome) = waitpoint_outcome_from_vm_error(&error) {
904 return Ok(outcome);
905 }
906 Err(error)
907 }
908 }
909}
910
911fn waitpoint_outcome_from_vm_error(error: &VmError) -> Option<WaitpointOutcome> {
912 let VmError::Thrown(VmValue::Dict(dict)) = error else {
913 return None;
914 };
915 let name = dict.get("name").and_then(vm_string)?;
916 match name {
917 "WaitpointTimeoutError" => Some(WaitpointOutcome::Timeout),
918 "WaitpointCancelledError" => Some(WaitpointOutcome::Cancelled {
919 wait_id: dict
920 .get("wait_id")
921 .and_then(vm_string)
922 .unwrap_or_default()
923 .to_string(),
924 waitpoint_ids: dict
925 .get("waitpoint_ids")
926 .and_then(vm_string_list)
927 .unwrap_or_default(),
928 reason: dict
929 .get("reason")
930 .and_then(vm_string)
931 .map(ToString::to_string),
932 }),
933 _ => None,
934 }
935}
936
/// Applies a recorded host response to the waitpoint of its request.
///
/// Nothing is done when the waitpoint is already in a non-open state.
/// Otherwise:
///
/// * question — the waitpoint is completed with the response's answer;
/// * escalation — the waitpoint is completed only when the response has
///   `accepted == Some(true)`; other responses leave it open;
/// * approval / dual control — the approval state is re-resolved from the
///   log; a pending state leaves the waitpoint open, an approved state appends
///   the approved event and completes the waitpoint with the approval record,
///   and a denied state appends the denied event and cancels the waitpoint.
///
/// # Errors
///
/// Every failure is returned as its string representation.
async fn finalize_hitl_response(
    log: &Arc<AnyEventLog>,
    kind: HitlRequestKind,
    response: &HitlHostResponse,
) -> Result<(), String> {
    match kind {
        HitlRequestKind::Question => {
            if waitpoint_is_terminal(log, &response.request_id).await? {
                return Ok(());
            }
            complete_waitpoint_on(
                log,
                &response.request_id,
                response.answer.clone(),
                response.reviewer.clone(),
                response.reason.clone(),
                response.metadata.clone(),
            )
            .await
            .map(|_| ())
            .map_err(|error| error.to_string())
        }
        HitlRequestKind::Escalation => {
            // A response that is not an explicit acceptance leaves the
            // escalation waiting. The terminal check only runs for
            // acceptances because `||` short-circuits.
            if !response.accepted.unwrap_or(false)
                || waitpoint_is_terminal(log, &response.request_id).await?
            {
                return Ok(());
            }
            complete_waitpoint_on(
                log,
                &response.request_id,
                Some(json!({
                    "accepted": true,
                    "reviewer": response.reviewer,
                    "reason": response.reason,
                    "responded_at": response.responded_at,
                })),
                response.reviewer.clone(),
                response.reason.clone(),
                response.metadata.clone(),
            )
            .await
            .map(|_| ())
            .map_err(|error| error.to_string())
        }
        HitlRequestKind::Approval | HitlRequestKind::DualControl => {
            if waitpoint_is_terminal(log, &response.request_id).await? {
                return Ok(());
            }
            // The decision is derived from the logged request and responses,
            // not from this single response.
            let request = load_request_envelope(log, kind, &response.request_id)
                .await
                .map_err(|error| error.to_string())?;
            match resolve_approval_state(log, kind, &request)
                .await
                .map_err(|error| error.to_string())?
            {
                ApprovalResolution::Pending => Ok(()),
                ApprovalResolution::Approved(progress) => {
                    let record = approval_record_json(&progress);
                    // The approved event is appended before the waitpoint is
                    // completed.
                    append_named_event(
                        log,
                        kind,
                        approved_event_kind(kind),
                        &request.request_id,
                        &request.trace_id,
                        json!({
                            "request_id": request.request_id.clone(),
                            "record": record.clone(),
                        }),
                    )
                    .await
                    .map_err(|error| error.to_string())?;
                    complete_waitpoint_on(
                        log,
                        &request.request_id,
                        Some(record),
                        response.reviewer.clone(),
                        progress.reason.clone(),
                        response.metadata.clone(),
                    )
                    .await
                    .map(|_| ())
                    .map_err(|error| error.to_string())
                }
                ApprovalResolution::Denied(denied) => {
                    // The denied event is appended before the waitpoint is
                    // cancelled; reviewer, reason and metadata come from the
                    // denying response.
                    append_named_event(
                        log,
                        kind,
                        denied_event_kind(kind),
                        &request.request_id,
                        &request.trace_id,
                        json!({
                            "request_id": request.request_id.clone(),
                            "reviewer": denied.reviewer.clone(),
                            "reason": denied.reason.clone(),
                        }),
                    )
                    .await
                    .map_err(|error| error.to_string())?;
                    cancel_waitpoint_on(
                        log,
                        &request.request_id,
                        denied.reviewer.clone(),
                        denied.reason.clone(),
                        denied.metadata.clone(),
                    )
                    .await
                    .map(|_| ())
                    .map_err(|error| error.to_string())
                }
            }
        }
    }
}
1051
1052async fn waitpoint_is_terminal(log: &Arc<AnyEventLog>, request_id: &str) -> Result<bool, String> {
1053 Ok(inspect_waitpoint_on(log, request_id)
1054 .await
1055 .map_err(|error| error.to_string())?
1056 .is_some_and(|record| record.status != WaitpointStatus::Open))
1057}
1058
1059async fn load_request_envelope(
1060 log: &Arc<AnyEventLog>,
1061 kind: HitlRequestKind,
1062 request_id: &str,
1063) -> Result<HitlRequestEnvelope, VmError> {
1064 let topic = topic(kind)?;
1065 let events = log
1066 .read_range(&topic, None, usize::MAX)
1067 .await
1068 .map_err(log_error)?;
1069 events
1070 .into_iter()
1071 .filter(|(_, event)| event.kind == kind.request_event_kind())
1072 .find_map(|(_, event)| {
1073 if !event_matches_request(&event, request_id) {
1074 return None;
1075 }
1076 serde_json::from_value::<HitlRequestEnvelope>(event.payload).ok()
1077 })
1078 .ok_or_else(|| {
1079 VmError::Runtime(format!("missing HITL request envelope for '{request_id}'"))
1080 })
1081}
1082
/// Replays every `hitl.response_received` event for `request` and decides
/// whether the approval is still pending, approved, or denied.
///
/// Events are processed in the order the log returns them:
/// - responses naming a reviewer outside a non-empty allow-list are ignored;
/// - responses from a reviewer who already signed are ignored;
/// - an approving response with a reviewer adds a signature; once the number
///   of distinct signing reviewers reaches the quorum the result is `Approved`;
/// - the first remaining response that is not an approval yields `Denied`.
///
/// # Errors
/// Returns `VmError::Runtime` when the quorum or topic is invalid, the log
/// cannot be read, or a matching response payload fails to deserialize.
async fn resolve_approval_state(
    log: &Arc<AnyEventLog>,
    kind: HitlRequestKind,
    request: &HitlRequestEnvelope,
) -> Result<ApprovalResolution, VmError> {
    let quorum = approval_quorum_from_request(kind, request)?;
    // An empty set means "no allow-list": any named reviewer may respond.
    let allowed_reviewers = approval_reviewers_from_request(kind, request)
        .into_iter()
        .collect::<BTreeSet<_>>();
    let mut progress = ApprovalProgress {
        request_id: request.request_id.clone(),
        reviewers: BTreeSet::new(),
        signatures: Vec::new(),
        reason: None,
        approved_at: None,
    };
    let topic = topic(kind)?;
    let events = log
        .read_range(&topic, None, usize::MAX)
        .await
        .map_err(log_error)?;
    for (_, event) in events {
        // Only host responses addressed to this request take part in the tally.
        if !event_matches_request(&event, &request.request_id)
            || event.kind != "hitl.response_received"
        {
            continue;
        }
        let response: HitlHostResponse = serde_json::from_value(event.payload)
            .map_err(|error| VmError::Runtime(error.to_string()))?;
        // NOTE(review): a response without a reviewer skips both checks below,
        // so an anonymous denial still resolves the request even when an
        // allow-list is set — confirm this is intended.
        if let Some(reviewer) = response.reviewer.as_deref() {
            if !allowed_reviewers.is_empty() && !allowed_reviewers.contains(reviewer) {
                continue;
            }
            // A reviewer counts once; later responses from them (approve or deny) are ignored.
            if progress.reviewers.contains(reviewer) {
                continue;
            }
        }
        // A missing `approved` flag is treated as "not approved".
        if response.approved.unwrap_or(false) {
            if let Some(reviewer) = response.reviewer.clone() {
                let signed_at = response.responded_at.clone().unwrap_or_else(now_rfc3339);
                progress.reviewers.insert(reviewer.clone());
                progress.signatures.push(ApprovalSignature {
                    reviewer: reviewer.clone(),
                    signed_at: signed_at.clone(),
                    // Use the host-provided signature when present, otherwise derive a receipt.
                    signature: response.signature.clone().unwrap_or_else(|| {
                        approval_receipt_signature(
                            &request.request_id,
                            &reviewer,
                            &signed_at,
                            true,
                            response.reason.as_deref(),
                        )
                    }),
                });
            }
            // The most recent approving response supplies the recorded reason and timestamp,
            // even when it had no reviewer and therefore added no signature.
            progress.reason = response.reason.clone();
            progress.approved_at = response.responded_at.clone();
            if progress.reviewers.len() as u32 >= quorum {
                return Ok(ApprovalResolution::Approved(progress));
            }
            continue;
        }
        return Ok(ApprovalResolution::Denied(response));
    }
    Ok(ApprovalResolution::Pending)
}
1149
1150fn approval_quorum_from_request(
1151 kind: HitlRequestKind,
1152 request: &HitlRequestEnvelope,
1153) -> Result<u32, VmError> {
1154 let key = match kind {
1155 HitlRequestKind::DualControl => "n",
1156 _ => "quorum",
1157 };
1158 let quorum = request
1159 .payload
1160 .get(key)
1161 .or_else(|| request.payload.get("approvers_required"))
1162 .or_else(|| {
1163 request
1164 .payload
1165 .get("approval_request")
1166 .and_then(|approval| approval.get("approvers_required"))
1167 })
1168 .and_then(JsonValue::as_u64)
1169 .unwrap_or(1);
1170 u32::try_from(quorum).map_err(|_| {
1171 VmError::Runtime(format!(
1172 "invalid quorum in HITL request '{}'",
1173 request.request_id
1174 ))
1175 })
1176}
1177
1178fn approval_reviewers_from_request(
1179 kind: HitlRequestKind,
1180 request: &HitlRequestEnvelope,
1181) -> Vec<String> {
1182 let key = match kind {
1183 HitlRequestKind::DualControl => "approvers",
1184 _ => "reviewers",
1185 };
1186 request
1187 .payload
1188 .get(key)
1189 .or_else(|| {
1190 request
1191 .payload
1192 .get("approval_request")
1193 .and_then(|approval| approval.get("reviewers"))
1194 })
1195 .and_then(JsonValue::as_array)
1196 .map(|values| {
1197 values
1198 .iter()
1199 .filter_map(JsonValue::as_str)
1200 .map(str::to_string)
1201 .collect()
1202 })
1203 .unwrap_or_default()
1204}
1205
1206fn approval_record_json(progress: &ApprovalProgress) -> JsonValue {
1207 json!({
1208 "request_id": progress.request_id.clone(),
1209 "approved": true,
1210 "reviewers": progress.reviewers.iter().cloned().collect::<Vec<_>>(),
1211 "approved_at": progress.approved_at.clone().unwrap_or_else(now_rfc3339),
1212 "reason": progress.reason,
1213 "signatures": progress.signatures,
1214 })
1215}
1216
1217fn approval_receipt_signature(
1218 request_id: &str,
1219 reviewer: &str,
1220 signed_at: &str,
1221 approved: bool,
1222 reason: Option<&str>,
1223) -> String {
1224 let material = format!(
1225 "harn-hitl-approval-v1\nrequest_id:{request_id}\nreviewer:{reviewer}\nsigned_at:{signed_at}\napproved:{approved}\nreason:{}\n",
1226 reason.unwrap_or("")
1227 );
1228 let hash = sha2::Sha256::digest(material.as_bytes());
1229 let hex: String = hash.iter().map(|byte| format!("{byte:02x}")).collect();
1230 format!("sha256:{hex}")
1231}
1232
1233fn approval_record_from_waitpoint(
1234 record: &WaitpointRecord,
1235 builtin: &str,
1236) -> Result<VmValue, VmError> {
1237 record
1238 .value
1239 .as_ref()
1240 .map(crate::stdlib::json_to_vm_value)
1241 .ok_or_else(|| VmError::Runtime(format!("{builtin}: missing approval record")))
1242}
1243
1244async fn approval_wait_error(
1245 log: &Arc<AnyEventLog>,
1246 kind: HitlRequestKind,
1247 request_id: &str,
1248) -> VmError {
1249 if let Ok(Some(record)) = inspect_waitpoint_on(log, request_id).await {
1250 if record.status == WaitpointStatus::Cancelled
1251 && record.reason.as_deref() != Some("upstream_cancelled")
1252 {
1253 return approval_denied_error(
1254 request_id,
1255 HitlHostResponse {
1256 request_id: request_id.to_string(),
1257 answer: None,
1258 approved: Some(false),
1259 accepted: None,
1260 reviewer: record.cancelled_by.clone(),
1261 reason: record.reason.clone(),
1262 metadata: record.metadata.clone(),
1263 responded_at: record.cancelled_at,
1264 signature: None,
1265 },
1266 );
1267 }
1268 if record.status == WaitpointStatus::Cancelled {
1269 return hitl_cancelled_error(
1270 request_id,
1271 kind,
1272 "",
1273 &[request_id.to_string()],
1274 record.reason,
1275 );
1276 }
1277 }
1278 hitl_cancelled_error(
1279 request_id,
1280 kind,
1281 "",
1282 &[request_id.to_string()],
1283 Some("upstream_cancelled".to_string()),
1284 )
1285}
1286
1287async fn append_timeout_once(
1288 log: &Arc<AnyEventLog>,
1289 kind: HitlRequestKind,
1290 request_id: &str,
1291 trace_id: &str,
1292) -> Result<(), VmError> {
1293 if hitl_event_exists(log, kind, request_id, "hitl.timeout").await? {
1294 return Ok(());
1295 }
1296 append_timeout(log, kind, request_id, trace_id).await
1297}
1298
1299async fn hitl_event_exists(
1300 log: &Arc<AnyEventLog>,
1301 kind: HitlRequestKind,
1302 request_id: &str,
1303 event_kind: &str,
1304) -> Result<bool, VmError> {
1305 let topic = topic(kind)?;
1306 let events = log
1307 .read_range(&topic, None, usize::MAX)
1308 .await
1309 .map_err(log_error)?;
1310 Ok(events
1311 .into_iter()
1312 .any(|(_, event)| event.kind == event_kind && event_matches_request(&event, request_id)))
1313}
1314
1315fn approved_event_kind(kind: HitlRequestKind) -> &'static str {
1316 match kind {
1317 HitlRequestKind::DualControl => "hitl.dual_control_approved",
1318 _ => "hitl.approval_approved",
1319 }
1320}
1321
1322fn denied_event_kind(kind: HitlRequestKind) -> &'static str {
1323 match kind {
1324 HitlRequestKind::DualControl => "hitl.dual_control_denied",
1325 _ => "hitl.approval_denied",
1326 }
1327}
1328
1329async fn append_request(
1330 log: &Arc<AnyEventLog>,
1331 request: &HitlRequestEnvelope,
1332) -> Result<(), VmError> {
1333 let topic = topic(request.kind)?;
1334 log.append(
1335 &topic,
1336 LogEvent::new(
1337 request.kind.request_event_kind(),
1338 serde_json::to_value(request).map_err(|error| VmError::Runtime(error.to_string()))?,
1339 )
1340 .with_headers(request_headers(request)),
1341 )
1342 .await
1343 .map(|_| ())
1344 .map_err(log_error)
1345}
1346
1347async fn append_named_event(
1348 log: &Arc<AnyEventLog>,
1349 kind: HitlRequestKind,
1350 event_kind: &str,
1351 request_id: &str,
1352 trace_id: &str,
1353 payload: JsonValue,
1354) -> Result<(), VmError> {
1355 let topic = topic(kind)?;
1356 let headers = headers_with_trace(request_id, trace_id);
1357 log.append(
1358 &topic,
1359 LogEvent::new(event_kind, payload).with_headers(headers),
1360 )
1361 .await
1362 .map(|_| ())
1363 .map_err(log_error)
1364}
1365
1366async fn append_timeout(
1367 log: &Arc<AnyEventLog>,
1368 kind: HitlRequestKind,
1369 request_id: &str,
1370 trace_id: &str,
1371) -> Result<(), VmError> {
1372 append_named_event(
1373 log,
1374 kind,
1375 "hitl.timeout",
1376 request_id,
1377 trace_id,
1378 serde_json::to_value(HitlTimeoutRecord {
1379 request_id: request_id.to_string(),
1380 kind,
1381 trace_id: trace_id.to_string(),
1382 timed_out_at: now_rfc3339(),
1383 })
1384 .map_err(|error| VmError::Runtime(error.to_string()))?,
1385 )
1386 .await
1387}
1388
1389async fn maybe_apply_mock_response(
1390 kind: HitlRequestKind,
1391 request_id: &str,
1392 request_payload: &JsonValue,
1393) -> Result<(), VmError> {
1394 let mut params = request_payload
1395 .as_object()
1396 .cloned()
1397 .unwrap_or_default()
1398 .into_iter()
1399 .map(|(key, value)| (key, crate::stdlib::json_to_vm_value(&value)))
1400 .collect::<crate::value::DictMap>();
1401 params.put_str("request_id", request_id);
1402 let Some(result) = dispatch_mock_host_call("hitl", kind.as_str(), ¶ms) else {
1403 return Ok(());
1404 };
1405 let value = result?;
1406 let responses = match value {
1407 VmValue::List(items) => items.iter().cloned().collect::<Vec<_>>(),
1408 other => vec![other],
1409 };
1410 for response in responses {
1411 let response_dict = response.as_dict().ok_or_else(|| {
1412 VmError::Runtime(format!(
1413 "mocked HITL {} response must be a dict or list<dict>",
1414 kind.as_str()
1415 ))
1416 })?;
1417 let hitl_response = parse_hitl_response_dict(request_id, response_dict)?;
1418 append_hitl_response(None, hitl_response)
1419 .await
1420 .map_err(VmError::Runtime)?;
1421 }
1422 Ok(())
1423}
1424
1425fn parse_hitl_response_dict(
1426 request_id: &str,
1427 response_dict: &crate::value::DictMap,
1428) -> Result<HitlHostResponse, VmError> {
1429 Ok(HitlHostResponse {
1430 request_id: request_id.to_string(),
1431 answer: response_dict
1432 .get("answer")
1433 .map(crate::llm::vm_value_to_json),
1434 approved: response_dict.get("approved").and_then(vm_bool),
1435 accepted: response_dict.get("accepted").and_then(vm_bool),
1436 reviewer: response_dict.get("reviewer").map(VmValue::display),
1437 reason: response_dict.get("reason").map(VmValue::display),
1438 metadata: response_dict
1439 .get("metadata")
1440 .map(crate::llm::vm_value_to_json),
1441 responded_at: response_dict.get("responded_at").map(VmValue::display),
1442 signature: response_dict.get("signature").map(VmValue::display),
1443 })
1444}
1445
1446fn maybe_notify_host(ctx: Option<&AsyncBuiltinCtx>, request: &HitlRequestEnvelope) {
1447 let Some(bridge) = ctx.and_then(|ctx| ctx.child_vm().bridge.clone()) else {
1448 return;
1449 };
1450 bridge.notify(
1451 "harn.hitl.requested",
1452 serde_json::to_value(request).unwrap_or(JsonValue::Null),
1453 );
1454}
1455
1456fn emit_hitl_requested(request: &HitlRequestEnvelope) {
1463 let Some(session_id) = crate::agent_sessions::current_session_id() else {
1464 return;
1465 };
1466 crate::agent_events::emit_event(&crate::agent_events::AgentEvent::HitlRequested {
1467 session_id,
1468 request_id: request.request_id.clone(),
1469 kind: request.kind.as_str().to_string(),
1470 payload: request.payload.clone(),
1471 });
1472}
1473
1474fn emit_hitl_resolved(request_id: &str, kind: HitlRequestKind, outcome: &str) {
1479 let Some(session_id) = crate::agent_sessions::current_session_id() else {
1480 return;
1481 };
1482 crate::agent_events::emit_event(&crate::agent_events::AgentEvent::HitlResolved {
1483 session_id,
1484 request_id: request_id.to_string(),
1485 kind: kind.as_str().to_string(),
1486 outcome: outcome.to_string(),
1487 });
1488}
1489
1490async fn wait_for_request_waitpoint_with_events(
1497 request_id: &str,
1498 kind: HitlRequestKind,
1499 timeout: Option<StdDuration>,
1500) -> Result<WaitpointOutcome, VmError> {
1501 let outcome = wait_for_request_waitpoint(request_id, timeout).await;
1502 let label = match &outcome {
1503 Ok(WaitpointOutcome::Completed(_)) => "answered",
1504 Ok(WaitpointOutcome::Timeout) => "timeout",
1505 Ok(WaitpointOutcome::Cancelled { .. }) => "cancelled",
1506 Err(_) => "error",
1507 };
1508 emit_hitl_resolved(request_id, kind, label);
1509 outcome
1510}
1511
1512fn parse_ask_user_options(value: Option<&VmValue>) -> Result<AskUserOptions, VmError> {
1513 let Some(value) = value else {
1514 return Ok(AskUserOptions {
1515 schema: None,
1516 timeout: Some(default_question_timeout()),
1517 default: None,
1518 });
1519 };
1520 let dict = value
1521 .as_dict()
1522 .ok_or_else(|| VmError::Runtime("ask_user: options must be a dict".to_string()))?;
1523 Ok(AskUserOptions {
1524 schema: dict
1525 .get("schema")
1526 .cloned()
1527 .filter(|value| !matches!(value, VmValue::Nil)),
1528 timeout: dict
1529 .get("timeout")
1530 .map(parse_duration_value)
1531 .transpose()?
1532 .or_else(|| Some(default_question_timeout())),
1533 default: dict
1534 .get("default")
1535 .cloned()
1536 .filter(|value| !matches!(value, VmValue::Nil)),
1537 })
1538}
1539
/// Returns the timeout applied to questions that do not specify one,
/// built from `HITL_QUESTION_TIMEOUT_MS` (24 hours).
fn default_question_timeout() -> StdDuration {
    StdDuration::from_millis(HITL_QUESTION_TIMEOUT_MS)
}
1543
1544fn escalation_capability_policy() -> JsonValue {
1545 crate::orchestration::current_execution_policy()
1546 .and_then(|policy| serde_json::to_value(policy).ok())
1547 .unwrap_or(JsonValue::Null)
1548}
1549
1550fn parse_approval_options(
1551 value: Option<&VmValue>,
1552 builtin: &str,
1553) -> Result<ApprovalOptions, VmError> {
1554 let dict = match value {
1555 None => None,
1556 Some(VmValue::Dict(dict)) => Some(dict),
1557 Some(_) => {
1558 return Err(VmError::Runtime(format!(
1559 "{builtin}: options must be a dict"
1560 )))
1561 }
1562 };
1563 let quorum = dict
1564 .and_then(|dict| dict.get("quorum"))
1565 .and_then(VmValue::as_int)
1566 .unwrap_or(1);
1567 if quorum <= 0 {
1568 return Err(VmError::Runtime(format!(
1569 "{builtin}: quorum must be positive"
1570 )));
1571 }
1572 let reviewers = optional_string_list(dict.and_then(|dict| dict.get("reviewers")), builtin)?;
1573 let capabilities_requested = optional_string_list(
1574 dict.and_then(|dict| dict.get("capabilities_requested")),
1575 builtin,
1576 )?;
1577 let evidence_refs = dict
1578 .and_then(|dict| dict.get("evidence_refs"))
1579 .map(|value| match value {
1580 VmValue::List(items) => Ok(items
1581 .iter()
1582 .map(crate::llm::vm_value_to_json)
1583 .collect::<Vec<_>>()),
1584 _ => Err(VmError::Runtime(format!(
1585 "{builtin}: evidence_refs must be a list"
1586 ))),
1587 })
1588 .transpose()?
1589 .unwrap_or_default();
1590 let deadline = dict
1591 .and_then(|dict| dict.get("deadline"))
1592 .map(parse_duration_value)
1593 .transpose()?
1594 .unwrap_or_else(|| StdDuration::from_millis(HITL_APPROVAL_TIMEOUT_MS));
1595 Ok(ApprovalOptions {
1596 detail: dict.and_then(|dict| dict.get("detail")).cloned(),
1597 args: dict.and_then(|dict| dict.get("args")).cloned(),
1598 quorum: quorum as u32,
1599 reviewers,
1600 deadline,
1601 principal: dict
1602 .and_then(|dict| dict.get("principal"))
1603 .map(VmValue::display)
1604 .filter(|value| !value.is_empty()),
1605 evidence_refs,
1606 undo_metadata: dict
1607 .and_then(|dict| dict.get("undo_metadata"))
1608 .map(crate::llm::vm_value_to_json),
1609 capabilities_requested,
1610 })
1611}
1612
1613fn required_string_arg(args: &[VmValue], idx: usize, builtin: &str) -> Result<String, VmError> {
1614 args.get(idx)
1615 .map(VmValue::display)
1616 .filter(|value| !value.is_empty())
1617 .ok_or_else(|| VmError::Runtime(format!("{builtin}: expected string argument at {idx}")))
1618}
1619
1620fn required_positive_int_arg(args: &[VmValue], idx: usize, builtin: &str) -> Result<i64, VmError> {
1621 let value = args
1622 .get(idx)
1623 .and_then(VmValue::as_int)
1624 .ok_or_else(|| VmError::Runtime(format!("{builtin}: expected int argument at {idx}")))?;
1625 if value <= 0 {
1626 return Err(VmError::Runtime(format!(
1627 "{builtin}: expected a positive int at {idx}"
1628 )));
1629 }
1630 Ok(value)
1631}
1632
1633fn optional_string_list(value: Option<&VmValue>, builtin: &str) -> Result<Vec<String>, VmError> {
1634 let Some(value) = value else {
1635 return Ok(Vec::new());
1636 };
1637 match value {
1638 VmValue::List(list) => Ok(list.iter().map(VmValue::display).collect()),
1639 _ => Err(VmError::Runtime(format!(
1640 "{builtin}: expected list<string>"
1641 ))),
1642 }
1643}
1644
/// Converts a VM value into a duration via `duration_from_value`, passing the
/// fixed labels `"hitl"` and `"timeout"` and `ErrorKind::Runtime`.
///
/// NOTE(review): this is also used for the approval `deadline` option, so any
/// message built from the `"timeout"` label may name the wrong option —
/// confirm how `duration_from_value` uses its labels.
fn parse_duration_value(value: &VmValue) -> Result<StdDuration, VmError> {
    duration_from_value(value, "hitl", "timeout", ErrorKind::Runtime)
}
1648
1649fn ensure_hitl_event_log() -> Arc<AnyEventLog> {
1650 active_event_log()
1651 .unwrap_or_else(|| install_memory_for_current_thread(HITL_EVENT_LOG_QUEUE_DEPTH))
1652}
1653
1654fn ensure_hitl_event_log_for(base_dir: Option<&Path>) -> Result<Arc<AnyEventLog>, String> {
1655 if let Some(log) = active_event_log() {
1656 return Ok(log);
1657 }
1658 let Some(base_dir) = base_dir else {
1659 return Ok(install_memory_for_current_thread(
1660 HITL_EVENT_LOG_QUEUE_DEPTH,
1661 ));
1662 };
1663 install_default_for_base_dir(base_dir).map_err(|error| error.to_string())
1664}
1665
1666fn current_dispatch_keys() -> Option<DispatchKeys> {
1667 let context = current_dispatch_context()?;
1668 let stable_base = context
1669 .replay_of_event_id
1670 .clone()
1671 .unwrap_or_else(|| context.trigger_event.id.0.clone());
1672 let instance_key = format!(
1673 "{}::{}",
1674 context.trigger_event.id.0,
1675 context.replay_of_event_id.as_deref().unwrap_or("live")
1676 );
1677 Some(DispatchKeys {
1678 instance_key,
1679 stable_base,
1680 agent: context.agent_id,
1681 trace_id: context.trigger_event.trace_id.0,
1682 })
1683}
1684
1685fn next_request_id(kind: HitlRequestKind, dispatch_keys: Option<&DispatchKeys>) -> String {
1686 if let Some(keys) = dispatch_keys {
1687 let seq = REQUEST_SEQUENCE.with(|slot| {
1688 let mut state = slot.borrow_mut();
1689 if state.instance_key != keys.instance_key {
1690 state.instance_key = keys.instance_key.clone();
1691 state.next_seq = 0;
1692 }
1693 state.next_seq += 1;
1694 state.next_seq
1695 });
1696 return format!("hitl_{}_{}_{}", kind.as_str(), keys.stable_base, seq);
1697 }
1698 format!("hitl_{}_{}", kind.as_str(), Uuid::now_v7())
1699}
1700
1701fn request_headers(request: &HitlRequestEnvelope) -> BTreeMap<String, String> {
1702 let mut headers = headers_with_trace(&request.request_id, &request.trace_id);
1703 if let Some(run_id) = request.run_id.as_ref() {
1704 headers.insert("run_id".to_string(), run_id.clone());
1705 }
1706 headers
1707}
1708
/// Builds a header map containing only the `request_id` entry.
fn response_headers(request_id: &str) -> BTreeMap<String, String> {
    BTreeMap::from([("request_id".to_string(), request_id.to_string())])
}
1714
1715fn headers_with_trace(request_id: &str, trace_id: &str) -> BTreeMap<String, String> {
1716 let mut headers = response_headers(request_id);
1717 headers.insert("trace_id".to_string(), trace_id.to_string());
1718 headers
1719}
1720
1721fn topic(kind: HitlRequestKind) -> Result<Topic, VmError> {
1722 Topic::new(kind.topic()).map_err(|error| VmError::Runtime(error.to_string()))
1723}
1724
1725fn event_matches_request(event: &LogEvent, request_id: &str) -> bool {
1726 event
1727 .headers
1728 .get("request_id")
1729 .is_some_and(|value| value == request_id)
1730 || event
1731 .payload
1732 .get("request_id")
1733 .and_then(JsonValue::as_str)
1734 .is_some_and(|value| value == request_id)
1735}
1736
1737fn approval_denied_error(request_id: &str, response: HitlHostResponse) -> VmError {
1738 VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1739 "name": "ApprovalDeniedError",
1740 "category": "generic",
1741 "message": response.reason.clone().unwrap_or_else(|| "approval was denied".to_string()),
1742 "request_id": request_id,
1743 "reviewers": response.reviewer.into_iter().collect::<Vec<_>>(),
1744 "reason": response.reason,
1745 })))
1746}
1747
1748fn hitl_cancelled_error(
1749 request_id: &str,
1750 kind: HitlRequestKind,
1751 wait_id: &str,
1752 waitpoint_ids: &[String],
1753 reason: Option<String>,
1754) -> VmError {
1755 let _ = categorized_error("HITL cancelled", ErrorCategory::Cancelled);
1756 let message = reason
1757 .clone()
1758 .unwrap_or_else(|| format!("{} cancelled", kind.as_str()));
1759 VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1760 "name": "HumanCancelledError",
1761 "category": ErrorCategory::Cancelled.as_str(),
1762 "message": message,
1763 "request_id": request_id,
1764 "kind": kind.as_str(),
1765 "wait_id": wait_id,
1766 "waitpoint_ids": waitpoint_ids,
1767 "reason": reason,
1768 })))
1769}
1770
1771fn timeout_error(request_id: &str, kind: HitlRequestKind) -> VmError {
1772 let _ = categorized_error("HITL timed out", ErrorCategory::Timeout);
1773 VmError::Thrown(crate::stdlib::json_to_vm_value(&json!({
1774 "name": "HumanTimeoutError",
1775 "category": ErrorCategory::Timeout.as_str(),
1776 "message": format!("{} timed out", kind.as_str()),
1777 "request_id": request_id,
1778 "kind": kind.as_str(),
1779 })))
1780}
1781
1782fn coerce_like_default(value: &VmValue, default: &VmValue) -> VmValue {
1783 match default {
1784 VmValue::Int(_) => match value {
1785 VmValue::Int(_) => value.clone(),
1786 VmValue::Float(number) => VmValue::Int(*number as i64),
1787 VmValue::String(text) => text
1788 .parse::<i64>()
1789 .map(VmValue::Int)
1790 .unwrap_or_else(|_| default.clone()),
1791 _ => default.clone(),
1792 },
1793 VmValue::Float(_) => match value {
1794 VmValue::Float(_) => value.clone(),
1795 VmValue::Int(number) => VmValue::Float(*number as f64),
1796 VmValue::String(text) => text
1797 .parse::<f64>()
1798 .map(VmValue::Float)
1799 .unwrap_or_else(|_| default.clone()),
1800 _ => default.clone(),
1801 },
1802 VmValue::Bool(_) => match value {
1803 VmValue::Bool(_) => value.clone(),
1804 VmValue::String(text) if text.eq_ignore_ascii_case("true") => VmValue::Bool(true),
1805 VmValue::String(text) if text.eq_ignore_ascii_case("false") => VmValue::Bool(false),
1806 _ => default.clone(),
1807 },
1808 VmValue::String(_) => VmValue::String(std::sync::Arc::from(value.display())),
1809 VmValue::Duration(_) => match value {
1810 VmValue::Duration(_) => value.clone(),
1811 VmValue::Int(ms) => VmValue::Duration(*ms),
1812 _ => default.clone(),
1813 },
1814 VmValue::Nil => value.clone(),
1815 _ => {
1816 if value.type_name() == default.type_name() {
1817 value.clone()
1818 } else {
1819 default.clone()
1820 }
1821 }
1822 }
1823}
1824
1825fn log_error(error: impl std::fmt::Display) -> VmError {
1826 VmError::Runtime(error.to_string())
1827}
1828
1829fn now_rfc3339() -> String {
1830 format_rfc3339(OffsetDateTime::now_utc())
1831}
1832
1833fn format_rfc3339(timestamp: OffsetDateTime) -> String {
1834 timestamp
1835 .format(&Rfc3339)
1836 .unwrap_or_else(|_| timestamp.to_string())
1837}
1838
1839fn deadline_after(requested_at: OffsetDateTime, duration: StdDuration) -> Option<String> {
1840 time::Duration::try_from(duration)
1841 .ok()
1842 .map(|duration| format_rfc3339(requested_at + duration))
1843}
1844
1845fn new_trace_id() -> String {
1846 format!("trace_{}", Uuid::now_v7())
1847}
1848
1849fn vm_bool(value: &VmValue) -> Option<bool> {
1850 match value {
1851 VmValue::Bool(flag) => Some(*flag),
1852 _ => None,
1853 }
1854}
1855
1856fn vm_string(value: &VmValue) -> Option<&str> {
1857 match value {
1858 VmValue::String(text) => Some(text.as_ref()),
1859 _ => None,
1860 }
1861}
1862
1863fn vm_string_list(value: &VmValue) -> Option<Vec<String>> {
1864 match value {
1865 VmValue::List(values) => Some(values.iter().map(VmValue::display).collect()),
1866 _ => None,
1867 }
1868}
1869
1870#[cfg(test)]
1871mod tests {
1872 use std::sync::OnceLock;
1873
1874 use tokio::sync::Mutex;
1875
1876 use super::{
1877 HITL_APPROVALS_TOPIC, HITL_DUAL_CONTROL_TOPIC, HITL_ESCALATIONS_TOPIC, HITL_QUESTIONS_TOPIC,
1878 };
1879 use crate::event_log::{install_default_for_base_dir, EventLog, Topic};
1880 use crate::{compile_source, register_vm_stdlib, reset_thread_local_state, Vm, VmError};
1881
1882 fn hitl_lock() -> &'static Mutex<()> {
1893 static LOCK: OnceLock<Mutex<()>> = OnceLock::new();
1894 LOCK.get_or_init(|| Mutex::new(()))
1895 }
1896
1897 async fn execute_hitl_script(
1898 base_dir: &std::path::Path,
1899 source: &str,
1900 ) -> Result<(String, Vec<String>, Vec<String>, Vec<String>, Vec<String>), VmError> {
1901 reset_thread_local_state();
1902 let log = install_default_for_base_dir(base_dir).expect("install event log");
1903 let chunk = compile_source(source).expect("compile source");
1904 let mut vm = Vm::new();
1905 register_vm_stdlib(&mut vm);
1906 vm.set_source_dir(base_dir);
1907 vm.execute(&chunk).await?;
1908 let output = vm.output().trim_end().to_string();
1909 let question_events = event_kinds(log.clone(), HITL_QUESTIONS_TOPIC).await;
1910 let approval_events = event_kinds(log.clone(), HITL_APPROVALS_TOPIC).await;
1911 let dual_control_events = event_kinds(log.clone(), HITL_DUAL_CONTROL_TOPIC).await;
1912 let escalation_events = event_kinds(log, HITL_ESCALATIONS_TOPIC).await;
1913 Ok((
1914 output,
1915 question_events,
1916 approval_events,
1917 dual_control_events,
1918 escalation_events,
1919 ))
1920 }
1921
1922 async fn event_kinds(
1923 log: std::sync::Arc<crate::event_log::AnyEventLog>,
1924 topic: &str,
1925 ) -> Vec<String> {
1926 log.read_range(&Topic::new(topic).expect("valid topic"), None, usize::MAX)
1927 .await
1928 .expect("read topic")
1929 .into_iter()
1930 .map(|(_, event)| event.kind)
1931 .collect()
1932 }
1933
1934 async fn event_payloads(
1935 log: std::sync::Arc<crate::event_log::AnyEventLog>,
1936 topic: &str,
1937 ) -> Vec<serde_json::Value> {
1938 log.read_range(&Topic::new(topic).expect("valid topic"), None, usize::MAX)
1939 .await
1940 .expect("read topic")
1941 .into_iter()
1942 .map(|(_, event)| event.payload)
1943 .collect()
1944 }
1945
1946 #[tokio::test(flavor = "current_thread")]
1947 async fn ask_user_coerces_to_default_type_and_logs_events() {
1948 tokio::task::LocalSet::new()
1949 .run_until(async {
1950 let dir = tempfile::tempdir().expect("tempdir");
1951 let source = r#"
1952pipeline test(task) {
1953 host_mock("hitl", "question", {answer: "9"})
1954 let answer: int = ask_user("Pick a number", {default: 0})
1955 __io_println(answer)
1956}
1957"#;
1958 let (
1959 output,
1960 question_events,
1961 approval_events,
1962 dual_control_events,
1963 escalation_events,
1964 ) = execute_hitl_script(dir.path(), source)
1965 .await
1966 .expect("script succeeds");
1967 assert_eq!(output, "9");
1968 assert_eq!(
1969 question_events,
1970 vec![
1971 "hitl.question_asked".to_string(),
1972 "hitl.response_received".to_string()
1973 ]
1974 );
1975 assert!(approval_events.is_empty());
1976 assert!(dual_control_events.is_empty());
1977 assert!(escalation_events.is_empty());
1978 })
1979 .await;
1980 }
1981
1982 #[tokio::test(flavor = "current_thread")]
1983 async fn request_approval_waits_for_quorum_and_emits_a_record() {
1984 let _guard = hitl_lock().lock().await;
1985 tokio::task::LocalSet::new()
1986 .run_until(async {
1987 reset_thread_local_state();
1988 let dir = tempfile::tempdir().expect("tempdir");
1989 let source = r#"
1990pipeline test(task) {
1991 host_mock("hitl", "approval", [
1992 {approved: true, reviewer: "alice", reason: "ok"},
1993 {approved: true, reviewer: "bob", reason: "ship it"},
1994 ])
1995 let record = request_approval(
1996 "deploy production",
1997 {quorum: 2, reviewers: ["alice", "bob", "carol"]},
1998 )
1999 __io_println(record.approved)
2000 __io_println(len(record.reviewers))
2001 __io_println(record.reviewers[0])
2002 __io_println(record.reviewers[1])
2003}
2004"#;
2005 let (_, _, approval_events, _, _) = execute_hitl_script(dir.path(), source)
2006 .await
2007 .expect("script succeeds");
2008 assert_eq!(
2009 approval_events,
2010 vec![
2011 "hitl.approval_requested".to_string(),
2012 "hitl.response_received".to_string(),
2013 "hitl.response_received".to_string(),
2014 "hitl.approval_approved".to_string(),
2015 ]
2016 );
2017 })
2018 .await;
2019 }
2020
2021 #[tokio::test(flavor = "current_thread")]
2022 async fn request_approval_emits_canonical_approval_request_payload() {
2023 tokio::task::LocalSet::new()
2024 .run_until(async {
2025 reset_thread_local_state();
2026 let dir = tempfile::tempdir().expect("tempdir");
2027 let log = install_default_for_base_dir(dir.path()).expect("install event log");
2028 let source = r#"
2029pipeline test(task) {
2030 host_mock("hitl", "approval", {approved: true, reviewer: "alice", reason: "ok"})
2031 request_approval("deploy production", {
2032 args: {environment: "prod"},
2033 quorum: 1,
2034 reviewers: ["alice"],
2035 evidence_refs: [{kind: "run", uri: "run_123"}],
2036 undo_metadata: {strategy: "rollback"},
2037 capabilities_requested: ["deploy.production"],
2038 })
2039}
2040"#;
2041 let chunk = compile_source(source).expect("compile source");
2042 let mut vm = Vm::new();
2043 register_vm_stdlib(&mut vm);
2044 vm.set_source_dir(dir.path());
2045 vm.execute(&chunk).await.expect("script succeeds");
2046
2047 let payloads = event_payloads(log, HITL_APPROVALS_TOPIC).await;
2048 let request_payload = &payloads[0]["payload"];
2049 let approval_request = &request_payload["approval_request"];
2050 assert_eq!(approval_request["id"], request_payload["id"]);
2051 assert_eq!(approval_request["action"], "deploy production");
2052 assert_eq!(approval_request["args"]["environment"], "prod");
2053 assert_eq!(approval_request["approvers_required"], 1);
2054 assert_eq!(approval_request["evidence_refs"][0]["uri"], "run_123");
2055 assert_eq!(approval_request["undo_metadata"]["strategy"], "rollback");
2056 assert_eq!(
2057 approval_request["capabilities_requested"][0],
2058 "deploy.production"
2059 );
2060 assert!(approval_request["requested_at"].as_str().is_some());
2061 assert!(approval_request["deadline"].as_str().is_some());
2062 })
2063 .await;
2064 }
2065
2066 #[tokio::test(flavor = "current_thread")]
2067 async fn request_approval_surfaces_denials_as_typed_errors() {
2068 let _guard = hitl_lock().lock().await;
2069 tokio::task::LocalSet::new()
2070 .run_until(async {
2071 reset_thread_local_state();
2072 let dir = tempfile::tempdir().expect("tempdir");
2073 let source = r#"
2074pipeline test(task) {
2075 host_mock("hitl", "approval", {approved: false, reviewer: "alice", reason: "unsafe"})
2076 let denied = try {
2077 request_approval("drop table", {reviewers: ["alice"]})
2078 }
2079 __io_println(is_err(denied))
2080 __io_println(unwrap_err(denied).name)
2081 __io_println(unwrap_err(denied).reason)
2082}
2083"#;
2084 let (output, _, approval_events, _, _) = execute_hitl_script(dir.path(), source)
2085 .await
2086 .expect("script succeeds");
2087 assert_eq!(output, "true\nApprovalDeniedError\nunsafe");
2088 assert_eq!(
2089 approval_events,
2090 vec![
2091 "hitl.approval_requested".to_string(),
2092 "hitl.response_received".to_string(),
2093 "hitl.approval_denied".to_string(),
2094 ]
2095 );
2096 })
2097 .await;
2098 }
2099
2100 #[tokio::test(flavor = "current_thread")]
2101 async fn dual_control_executes_action_after_quorum() {
2102 tokio::task::LocalSet::new()
2103 .run_until(async {
2104 let dir = tempfile::tempdir().expect("tempdir");
2105 let source = r#"
2106pipeline test(task) {
2107 host_mock("hitl", "dual_control", [
2108 {approved: true, reviewer: "alice"},
2109 {approved: true, reviewer: "bob"},
2110 ])
2111 let result = dual_control(2, 3, { -> "launched" }, ["alice", "bob", "carol"])
2112 __io_println(result)
2113}
2114"#;
2115 let (output, _, _, dual_control_events, _) =
2116 execute_hitl_script(dir.path(), source)
2117 .await
2118 .expect("script succeeds");
2119 assert_eq!(output, "launched");
2120 assert_eq!(
2121 dual_control_events,
2122 vec![
2123 "hitl.dual_control_requested".to_string(),
2124 "hitl.response_received".to_string(),
2125 "hitl.response_received".to_string(),
2126 "hitl.dual_control_approved".to_string(),
2127 "hitl.dual_control_executed".to_string(),
2128 ]
2129 );
2130 })
2131 .await;
2132 }
2133
2134 #[tokio::test(flavor = "current_thread")]
2135 async fn escalate_to_waits_for_acceptance_event() {
2136 tokio::task::LocalSet::new()
2137 .run_until(async {
2138 let dir = tempfile::tempdir().expect("tempdir");
2139 let source = r#"
2140pipeline test(task) {
2141 host_mock("hitl", "escalation", {accepted: true, reviewer: "lead", reason: "taking over"})
2142 let handle = escalate_to("admin", "need override")
2143 __io_println(handle.status)
2144 __io_println(handle.reviewer)
2145}
2146"#;
2147 let (output, _, _, _, escalation_events) = execute_hitl_script(dir.path(), source)
2148 .await
2149 .expect("script succeeds");
2150 assert_eq!(output, "accepted\nlead");
2151 assert_eq!(
2152 escalation_events,
2153 vec![
2154 "hitl.escalation_issued".to_string(),
2155 "hitl.escalation_accepted".to_string(),
2156 ]
2157 );
2158 })
2159 .await;
2160 }
2161
2162 #[tokio::test(flavor = "current_thread")]
2168 async fn ask_user_emits_hitl_request_and_resolution_to_agent_event_sinks() {
2169 use std::sync::Mutex as StdMutex;
2170
2171 tokio::task::LocalSet::new()
2172 .run_until(async {
2173 let dir = tempfile::tempdir().expect("tempdir");
2174 let session_id = "hitl-session".to_string();
2175 let captured: std::sync::Arc<StdMutex<Vec<crate::agent_events::AgentEvent>>> =
2176 std::sync::Arc::new(StdMutex::new(Vec::new()));
2177
2178 struct CaptureSink(std::sync::Arc<StdMutex<Vec<crate::agent_events::AgentEvent>>>);
2179 impl crate::agent_events::AgentEventSink for CaptureSink {
2180 fn handle_event(&self, event: &crate::agent_events::AgentEvent) {
2181 self.0.lock().expect("captured").push(event.clone());
2182 }
2183 }
2184
2185 crate::reset_thread_local_state();
2191 crate::event_log::install_default_for_base_dir(dir.path())
2192 .expect("install event log");
2193
2194 crate::agent_events::reset_all_sinks();
2195 let sink: std::sync::Arc<dyn crate::agent_events::AgentEventSink> =
2196 std::sync::Arc::new(CaptureSink(captured.clone()));
2197 crate::agent_events::register_sink(session_id.clone(), sink);
2198 crate::agent_sessions::open_or_create(Some(session_id.clone()));
2199 let _guard = crate::agent_sessions::enter_current_session(session_id.clone());
2200
2201 let source = r#"
2202pipeline test(task) {
2203 host_mock("hitl", "question", {answer: "ok"})
2204 let answer: string = ask_user("Are you sure?", {default: "no"})
2205 __io_println(answer)
2206}
2207"#;
2208 let chunk = crate::compile_source(source).expect("compile source");
2209 let mut vm = Vm::new();
2210 register_vm_stdlib(&mut vm);
2211 vm.set_source_dir(dir.path());
2212 vm.execute(&chunk).await.expect("script runs");
2213 assert_eq!(vm.output().trim_end(), "ok");
2214
2215 let events = captured.lock().expect("captured");
2216 let mut iter = events.iter().filter(|event| {
2217 matches!(
2218 event,
2219 crate::agent_events::AgentEvent::HitlRequested { .. }
2220 | crate::agent_events::AgentEvent::HitlResolved { .. }
2221 )
2222 });
2223 let requested = iter.next().expect("HitlRequested emitted");
2224 let resolved = iter.next().expect("HitlResolved emitted");
2225 assert!(iter.next().is_none(), "exactly one pair: {events:?}");
2226
2227 let crate::agent_events::AgentEvent::HitlRequested {
2228 session_id: req_session,
2229 request_id: req_id,
2230 kind: req_kind,
2231 payload,
2232 } = requested
2233 else {
2234 panic!("expected HitlRequested, got: {requested:?}");
2235 };
2236 assert_eq!(req_session, &session_id);
2237 assert_eq!(req_kind, "question");
2238 assert!(req_id.starts_with("hitl_question_"));
2239 assert_eq!(payload["prompt"], "Are you sure?");
2240
2241 let crate::agent_events::AgentEvent::HitlResolved {
2242 request_id: res_id,
2243 kind: res_kind,
2244 outcome,
2245 ..
2246 } = resolved
2247 else {
2248 panic!("expected HitlResolved, got: {resolved:?}");
2249 };
2250 assert_eq!(res_id, req_id);
2251 assert_eq!(res_kind, "question");
2252 assert_eq!(outcome, "answered");
2253
2254 drop(_guard);
2255 crate::agent_events::reset_all_sinks();
2256 })
2257 .await;
2258 }
2259}