harn_vm/agent_events/agent.rs
1use serde::{Deserialize, Serialize};
2
3use crate::composition::{CompositionChildCall, CompositionChildResult, CompositionRunEnvelope};
4use crate::llm::receipts::ToolCallReceipt;
5use crate::orchestration::{HandoffArtifact, MutationSessionRecord};
6use crate::tool_annotations::ToolKind;
7
8use super::tool::{ToolCallErrorCategory, ToolCallStatus, ToolExecutor};
9use super::worker::{FsWatchEvent, WorkerEvent};
10
11/// Events emitted by the agent loop. Some variants map 1:1 to ACP
12/// `sessionUpdate` variants; Harn-specific lifecycle events ride on the
13/// extension stream.
14#[derive(Clone, Debug, Serialize, Deserialize)]
15#[serde(tag = "type", rename_all = "snake_case")]
16pub enum AgentEvent {
17 AgentMessageChunk {
18 session_id: String,
19 content: String,
20 },
21 AgentThoughtChunk {
22 session_id: String,
23 content: String,
24 },
25 UserMessage {
26 session_id: String,
27 message_id: String,
28 content: Vec<serde_json::Value>,
29 },
30 ToolCall {
31 session_id: String,
32 tool_call_id: String,
33 tool_name: String,
34 kind: Option<ToolKind>,
35 status: ToolCallStatus,
36 raw_input: serde_json::Value,
37 /// Set to `Some(true)` by the streaming candidate detector
38 /// (harn#692) when this event represents a tool-call shape
39 /// detected in the model's in-flight assistant text but whose
40 /// arguments have not finished parsing yet. Clients can render a
41 /// spinner / placeholder while the model writes the body. The
42 /// detector follows up with a `ToolCallUpdate { parsing: false,
43 /// .. }` carrying either `status: pending` (promoted) or
44 /// `status: failed` with `error_category: parse_aborted`.
45 /// `None` (the default) means "this is a normal post-parse tool
46 /// call, no candidate phase was active" so the on-disk shape
47 /// stays compatible with replays recorded before this field
48 /// existed.
49 #[serde(default, skip_serializing_if = "Option::is_none")]
50 parsing: Option<bool>,
51 /// Mutation-session audit context active when the tool was
52 /// dispatched (see harn#699). Hosts use it to group every tool
53 /// emission belonging to the same write-capable session.
54 #[serde(default, skip_serializing_if = "Option::is_none")]
55 audit: Option<MutationSessionRecord>,
56 },
57 ToolCallUpdate {
58 session_id: String,
59 tool_call_id: String,
60 tool_name: String,
61 status: ToolCallStatus,
62 raw_output: Option<serde_json::Value>,
63 error: Option<String>,
64 /// Wall-clock milliseconds from the parse-to-execution boundary
65 /// to the terminal `Completed`/`Failed` update. Includes the
66 /// time spent in any wrapping orchestration logic (loop checks,
67 /// post-tool hooks, microcompaction). Populated only on the
68 /// terminal update — `None` on intermediate `Pending` /
69 /// `InProgress` updates so clients can ignore the field until
70 /// it shows up.
71 #[serde(default, skip_serializing_if = "Option::is_none")]
72 duration_ms: Option<u64>,
73 /// Milliseconds spent in the actual host/builtin/MCP dispatch
74 /// call only (the inner `dispatch_tool_execution` window).
75 /// Populated only on the terminal update; `None` otherwise.
76 #[serde(default, skip_serializing_if = "Option::is_none")]
77 execution_duration_ms: Option<u64>,
78 /// Structured classification of the failure (when `status` is
79 /// `Failed`). Paired with `error` so clients can render each
80 /// category distinctly without parsing free-form strings. Always
81 /// `None` for non-Failed updates and serialized as
82 /// `errorCategory` in the ACP wire format.
83 #[serde(default, skip_serializing_if = "Option::is_none")]
84 error_category: Option<ToolCallErrorCategory>,
85 /// Where the tool actually ran. `None` only for events emitted
86 /// from sites that pre-date the dispatch decision (e.g. the
87 /// pending → in-progress transition the loop emits before the
88 /// dispatcher picks a backend).
89 #[serde(default, skip_serializing_if = "Option::is_none")]
90 executor: Option<ToolExecutor>,
91 /// Companion to `ToolCall.parsing` (harn#692). The streaming
92 /// candidate detector emits the *terminal* candidate event as a
93 /// `ToolCallUpdate` with `parsing: Some(false)` to retract the
94 /// in-flight `parsing: true` chip — either by promoting the
95 /// candidate (`status: pending`, populated `raw_output: None`,
96 /// `error: None`) or aborting it (`status: failed`,
97 /// `error_category: parse_aborted`). `None` means this update is
98 /// not part of a candidate-phase transition.
99 #[serde(default, skip_serializing_if = "Option::is_none")]
100 parsing: Option<bool>,
101 /// Best-effort partial parse of the streamed tool-call arguments.
102 /// Populated by the SSE transport on `Pending` updates as the
103 /// model streams `input_json_delta` (Anthropic) or
104 /// `tool_calls[].function.arguments` deltas (OpenAI). `None` on
105 /// terminal updates and on emissions from non-streaming paths
106 /// (#693). When the partial bytes are not yet parseable as JSON
107 /// the transport falls back to `raw_input_partial`.
108 #[serde(default, skip_serializing_if = "Option::is_none")]
109 raw_input: Option<serde_json::Value>,
110 /// Raw concatenated bytes of the streamed tool-call arguments
111 /// when a permissive parse failed (#693). Mutually exclusive
112 /// with `raw_input`: clients render whichever is present.
113 #[serde(default, skip_serializing_if = "Option::is_none")]
114 raw_input_partial: Option<String>,
115 /// Mutation-session audit context for the tool call. Carries the
116 /// same payload as on the paired `ToolCall` event so a host
117 /// processing a single update doesn't have to correlate against
118 /// the prior pending event.
119 #[serde(default, skip_serializing_if = "Option::is_none")]
120 audit: Option<MutationSessionRecord>,
121 },
122 Plan {
123 session_id: String,
124 plan: serde_json::Value,
125 },
126 ProgressReported {
127 session_id: String,
128 message: Option<String>,
129 entries: serde_json::Value,
130 replace: bool,
131 metadata: serde_json::Value,
132 },
133 /// Emitted when the compass observes a freeform edit and either
134 /// suggests a structural primitive, rewrites the tool call, or falls
135 /// back because rewrite mode could not prove equivalence.
136 CompassRoutingDecision {
137 session_id: String,
138 tool_call_id: String,
139 mode: String,
140 action: String,
141 persona: String,
142 original_tool: String,
143 routed_tool: String,
144 target_tool: String,
145 #[serde(default, skip_serializing_if = "Option::is_none")]
146 path: Option<String>,
147 },
148 /// Emitted after an agent scratchpad reorganization attempt. The
149 /// scratchpad body itself stays in session state; this event carries
150 /// status and count/error metadata so live UIs and eval harnesses can
151 /// audit whether reorganization helped or damaged the working set.
152 AgentScratchpadReorganization {
153 session_id: String,
154 iteration: usize,
155 status: String,
156 details: serde_json::Value,
157 },
158 /// A renderable, declarative artifact spec emitted by an agent. Harn
159 /// validates the payload and transports it; host surfaces own rendering
160 /// and may fall back to the plain-text representation.
161 Artifact {
162 session_id: String,
163 artifact_id: String,
164 kind: String,
165 #[serde(default, skip_serializing_if = "Option::is_none")]
166 title: Option<String>,
167 mime_type: String,
168 spec: serde_json::Value,
169 fallback: String,
170 size_bytes: u64,
171 provenance: serde_json::Value,
172 metadata: serde_json::Value,
173 },
174 /// Fires at the top of every model round-trip inside an
175 /// `agent_loop` invocation. Maps to the `iteration_start` steering
176 /// seam. Not the same as ACP's outer `prompt_turn` boundary; an
177 /// `agent_turn`/`prompt_turn` cycle contains many of these.
178 IterationStart {
179 session_id: String,
180 iteration: usize,
181 /// Configured provider for the impending LLM call. Empty when the
182 /// caller defers provider selection to the routing layer.
183 /// Surfaces here so observers can show "about to call X/Y" before
184 /// the call returns — previously this only landed in the
185 /// transcript after the response, leaving live pulse-check
186 /// consumers without a model attribution for in-flight iterations.
187 #[serde(default, skip_serializing_if = "String::is_empty")]
188 provider: String,
189 /// Configured model id. Same semantics as `provider`.
190 #[serde(default, skip_serializing_if = "String::is_empty")]
191 model: String,
192 },
193 /// Fires at the bottom of every model round-trip, after tool
194 /// dispatch (or after the dispatch was skipped). Sibling of
195 /// `IterationStart`.
196 IterationEnd {
197 session_id: String,
198 iteration: usize,
199 /// Free-form dict carrying the post-call snapshot. Stable keys
200 /// emitted by the agent loop: `tool_count`, `text`, plus the
201 /// LLM-result projection — `provider`, `model`, `response_ms`,
202 /// `input_tokens`, `output_tokens`, `thinking_chars`. Hosts that
203 /// surface latency/cost panes key off these without re-parsing
204 /// the transcript JSONL.
205 iteration_info: serde_json::Value,
206 },
207 /// Emitted when a first-class agent session is explicitly closed by
208 /// `agent_session_close`. This gives event-log consumers a typed
209 /// terminal marker even when no final model turn runs.
210 SessionClosed {
211 session_id: String,
212 reason: String,
213 status: String,
214 metadata: serde_json::Value,
215 },
216 /// Emitted when `agent_session_reanchor` swaps the primary workspace
217 /// anchor (#2218). Hosts use this to drive cross-project handoff UX.
218 /// Carries the previous and current anchors so consumers can diff
219 /// without re-fetching session state.
220 AnchorChanged {
221 session_id: String,
222 previous: Option<serde_json::Value>,
223 current: serde_json::Value,
224 carry_transcript: bool,
225 compacted: bool,
226 reason: Option<String>,
227 },
228 JudgeDecision {
229 session_id: String,
230 iteration: usize,
231 verdict: String,
232 reasoning: String,
233 next_step: Option<String>,
234 judge_duration_ms: u64,
235 #[serde(default, skip_serializing_if = "Option::is_none")]
236 trigger: Option<String>,
237 },
238 /// Per-step critique decision emitted by `agent_step_judge`.
239 /// Sibling of [`JudgeDecision`] but fired BEFORE tool dispatch on
240 /// every assistant turn (when configured), not just at completion.
241 /// `on_veto` carries the configured remediation shape
242 /// (`"replace"` or `"retain"`); `cost_usd` is best-effort from the
243 /// stdlib economics estimator and may be 0 when pricing is unknown.
244 /// `skipped` marks configured short-circuits that did not call the
245 /// judge model.
246 StepJudgeDecision {
247 session_id: String,
248 iteration: usize,
249 verdict: String,
250 reasoning: String,
251 critique: String,
252 confidence: f64,
253 judge_duration_ms: u64,
254 vetoed: bool,
255 #[serde(default, skip_serializing_if = "std::ops::Not::not")]
256 skipped: bool,
257 #[serde(default, skip_serializing_if = "Option::is_none")]
258 reason: Option<String>,
259 /// True when this `verdict: "pass"` is the result of the step-judge
260 /// model itself erroring and `fail_open` swallowing the error — the
261 /// turn proceeded, but the adversarial-review surface was UNAVAILABLE
262 /// (not a genuine approval). Lets telemetry tell an inert reviewer
263 /// apart from a real pass. Mirrors `reason: "judge_unavailable"`.
264 #[serde(default, skip_serializing_if = "std::ops::Not::not")]
265 judge_error: bool,
266 on_veto: String,
267 input_tokens: u64,
268 output_tokens: u64,
269 cost_usd: f64,
270 provider: String,
271 model: String,
272 },
273 /// Deterministic pre-dispatch critique emitted by the structural
274 /// validator middleware. Fires before any LLM-backed judge so hosts
275 /// can distinguish "$0 structural retry" from semantic critique.
276 StructuralValidatorDecision {
277 session_id: String,
278 iteration: usize,
279 rule: String,
280 diagnostic: String,
281 recommended_action: String,
282 vetoed: bool,
283 #[serde(default, skip_serializing_if = "std::ops::Not::not")]
284 skipped: bool,
285 #[serde(default, skip_serializing_if = "Option::is_none")]
286 reason: Option<String>,
287 on_failure: String,
288 attempts: usize,
289 max_attempts: usize,
290 },
291 ScopeClassifierVerdict {
292 session_id: String,
293 iteration: usize,
294 label: String,
295 original_label: String,
296 confidence: f64,
297 confidence_threshold: f64,
298 evidence: String,
299 skip_main_turn: bool,
300 #[serde(default, skip_serializing_if = "Option::is_none")]
301 classifier_kind: Option<String>,
302 #[serde(default, skip_serializing_if = "Option::is_none")]
303 model: Option<String>,
304 #[serde(default, skip_serializing_if = "Option::is_none")]
305 error: Option<String>,
306 },
307 MissingToolCallVerdict {
308 session_id: String,
309 iteration: usize,
310 action: String,
311 original_action: String,
312 tool_name: String,
313 confidence: f64,
314 confidence_threshold: f64,
315 evidence: String,
316 #[serde(default, skip_serializing_if = "Option::is_none")]
317 language: Option<String>,
318 #[serde(default, skip_serializing_if = "Option::is_none")]
319 classifier_kind: Option<String>,
320 #[serde(default, skip_serializing_if = "Option::is_none")]
321 model: Option<String>,
322 #[serde(default, skip_serializing_if = "Option::is_none")]
323 error: Option<String>,
324 },
325 TypedCheckpoint {
326 session_id: String,
327 checkpoint: serde_json::Value,
328 },
329 FeedbackInjected {
330 session_id: String,
331 kind: String,
332 content: String,
333 },
334 /// Emitted when the agent loop exhausts `max_iterations` without any
335 /// explicit break condition firing. Distinct from a natural "done" or
336 /// a "stuck" nudge-exhaustion: this is strictly a budget cap.
337 BudgetExhausted {
338 session_id: String,
339 max_iterations: usize,
340 #[serde(default, skip_serializing_if = "Option::is_none")]
341 kind: Option<String>,
342 #[serde(default, skip_serializing_if = "Option::is_none")]
343 cost_usd: Option<f64>,
344 #[serde(default, skip_serializing_if = "Option::is_none")]
345 wall_clock_ms: Option<u64>,
346 },
347 /// Emitted when a loop-level budget circuit breaker trips after N
348 /// consecutive retryable failures. `paused_for_ms` is the mock-time-aware
349 /// backoff already honored before the terminal budget event.
350 BudgetCircuitBreaker {
351 session_id: String,
352 kind: String,
353 consecutive_count: usize,
354 paused_for_ms: u64,
355 },
356 /// Emitted when the loop breaks because consecutive text-only turns
357 /// hit `max_nudges`. Parity with `BudgetExhausted` / `IterationEnd` for
358 /// hosts that key off agent-terminal events.
359 LoopStuck {
360 session_id: String,
361 max_nudges: usize,
362 last_iteration: usize,
363 tail_excerpt: String,
364 },
365 /// Pipeline-authored stuck/escalation signal emitted through
366 /// `agent_emit_event("loop_stuck", payload)`. The runtime-level
367 /// `LoopStuck` variant above remains the built-in max-nudge terminal event;
368 /// this variant preserves the pipeline payload so hosts can surface richer
369 /// handoff/escalation details without inventing another wire kind.
370 LoopStuckSignal {
371 session_id: String,
372 payload: serde_json::Value,
373 },
374 /// Emitted by the reserved-budget terminal-verify guard
375 /// (`agent_emit_event("reserved_terminal_verify", payload)`). The guard
376 /// holds back a small iteration reserve the main loop cannot consume; when
377 /// the loop would otherwise terminate on a budget/stuck boundary with an
378 /// unverified source write, it spends the reserve on a final verify(+repair)
379 /// instead of ending blind on a red build. The payload's `phase` field tags
380 /// the step (`grant` / `verify_passed` / `verify_failed`) so replayers and
381 /// operators can see the guard fire and its outcome. Payload-preserving like
382 /// `LoopStuckSignal` so the guard can carry richer detail without inventing
383 /// another wire kind.
384 ReservedTerminalVerify {
385 session_id: String,
386 payload: serde_json::Value,
387 },
388 /// Emitted when the daemon idle-wait loop trips its watchdog because
389 /// every configured wake source returned `None` for N consecutive
390 /// attempts. Exists so a broken daemon doesn't hang the session
391 /// silently.
392 DaemonWatchdogTripped {
393 session_id: String,
394 attempts: usize,
395 elapsed_ms: u64,
396 },
397 /// Emitted when a skill is activated. Carries the match reason so
398 /// replayers can reconstruct *why* a given skill took effect at
399 /// this iteration.
400 SkillActivated {
401 session_id: String,
402 skill_name: String,
403 iteration: usize,
404 reason: String,
405 },
406 /// Emitted when a previously-active skill is deactivated because
407 /// the reassess phase no longer matches it.
408 SkillDeactivated {
409 session_id: String,
410 skill_name: String,
411 iteration: usize,
412 },
413 /// Emitted once per activation when the skill's `allowed_tools` filter
414 /// narrows the effective tool surface exposed to the model.
415 SkillScopeTools {
416 session_id: String,
417 skill_name: String,
418 allowed_tools: Vec<String>,
419 },
420 /// Emitted when the agent loop ratchets the model-visible tool
421 /// surface narrower after observing recent tool-call usage. Unlike
422 /// `SkillScopeTools`, this is session-local and can only remove
423 /// tools from the currently-effective surface.
424 SkillNarrow {
425 session_id: String,
426 reason: String,
427 removed_tools: Vec<String>,
428 remaining_tools: Vec<String>,
429 #[serde(default, skip_serializing_if = "serde_json::Value::is_null")]
430 policy: serde_json::Value,
431 #[serde(default, skip_serializing_if = "serde_json::Value::is_null")]
432 removed_tool_details: serde_json::Value,
433 #[serde(default, skip_serializing_if = "serde_json::Value::is_null")]
434 kept_tool_details: serde_json::Value,
435 },
436 /// Read-only stance lifecycle (std/agent/stance): `phase` is one of
437 /// `armed`, `write_access_granted`, `write_access_denied`,
438 /// `disarmed`. Arming carries the permitted tool window; the
439 /// grant/deny phases carry the escape-hatch justification and the
440 /// consent verdict so a trace viewer can explain every elevation.
441 StanceTransition {
442 session_id: String,
443 phase: String,
444 escape_tool: String,
445 #[serde(default, skip_serializing_if = "Vec::is_empty")]
446 allowed_tools: Vec<String>,
447 #[serde(default, skip_serializing_if = "String::is_empty")]
448 justification: String,
449 #[serde(default, skip_serializing_if = "String::is_empty")]
450 consent: String,
451 #[serde(default, skip_serializing_if = "String::is_empty")]
452 reason: String,
453 },
454 /// Emitted when a `tool_search` query is issued by the model. Carries
455 /// the raw query args, the configured strategy, and a `mode` tag
456 /// distinguishing the client-executed fallback (`"client"`) from
457 /// provider-native paths (`"anthropic"` / `"openai"`). Mirrors the
458 /// transcript event shape so hosts can render a search-in-progress
459 /// chip in real time — the replay path walks the transcript after
460 /// the turn, which is too late for live UX.
461 ToolSearchQuery {
462 session_id: String,
463 tool_use_id: String,
464 name: String,
465 query: serde_json::Value,
466 strategy: String,
467 mode: String,
468 },
469 /// Emitted when `tool_search` resolves — carries the list of tool
470 /// names newly promoted into the model's effective surface for the
471 /// next turn. Pair-emitted with `ToolSearchQuery` on every search.
472 ToolSearchResult {
473 session_id: String,
474 tool_use_id: String,
475 promoted: Vec<String>,
476 strategy: String,
477 mode: String,
478 },
479 TranscriptCompacted {
480 session_id: String,
481 mode: String,
482 reason: String,
483 strategy: String,
484 archived_messages: usize,
485 estimated_tokens_before: usize,
486 estimated_tokens_after: usize,
487 snapshot_asset_id: Option<String>,
488 #[serde(default, skip_serializing_if = "Option::is_none")]
489 instruction_mode: Option<String>,
490 #[serde(default, skip_serializing_if = "Option::is_none")]
491 instruction_source: Option<String>,
492 #[serde(default, skip_serializing_if = "Option::is_none")]
493 compaction_policy: Option<serde_json::Value>,
494 },
495 /// Emitted whenever `transcript_project` derives a model-visible
496 /// prefix from the immutable raw transcript. Hosts that render a
497 /// side-by-side raw/projected view subscribe to this — the typed
498 /// payload mirrors the metadata on the persisted
499 /// `transcript.projection` transcript event so clients don't have to
500 /// re-parse the transcript to sync UI state.
501 TranscriptProjected {
502 session_id: String,
503 policy: String,
504 reason: String,
505 prefix_hash: String,
506 kept_count: usize,
507 dropped_count: usize,
508 provider_safety_blocked: bool,
509 #[serde(default, skip_serializing_if = "is_zero_usize")]
510 redacted_count: usize,
511 #[serde(default, skip_serializing_if = "is_zero_usize")]
512 reclaimed_tokens: usize,
513 #[serde(default, skip_serializing_if = "Vec::is_empty")]
514 roots_consulted: Vec<String>,
515 #[serde(default, skip_serializing_if = "Vec::is_empty")]
516 redaction_pointers: Vec<serde_json::Value>,
517 },
518 /// Emitted when a pending `system_reminder` is rendered into the
519 /// next provider request. ACP clients show these in a reminder lane
520 /// instead of mixing them into assistant text chunks.
521 ReminderEmitted {
522 session_id: String,
523 reminder_id: String,
524 tags: Vec<String>,
525 body: String,
526 role_hint: String,
527 rendered_role: String,
528 source: String,
529 ttl_turns: Option<i64>,
530 },
531 Handoff {
532 session_id: String,
533 artifact_id: String,
534 handoff: Box<HandoffArtifact>,
535 },
536 FsWatch {
537 session_id: String,
538 subscription_id: String,
539 events: Vec<FsWatchEvent>,
540 },
541 /// Emitted when hostlib staged filesystem state changes for a session.
542 /// The ACP adapter maps this to the existing `progress` extension so
543 /// clients can update rollup-diff badges without waiting for a prompt
544 /// turn boundary.
545 StagedWritesPending {
546 session_id: String,
547 pending_count: usize,
548 total_bytes: u64,
549 },
550 /// Per-call outcome of `hostlib_fs_safe_text_patch`. Hosts subscribe to
551 /// this to roll up stale-base / hunk-conflict rates and average
552 /// hunks-per-patch without scraping result dicts out of pipeline logs.
553 /// Fired from both the staged-overlay and direct-disk code paths so
554 /// the rollup is comprehensive.
555 SafeTextPatchResult {
556 session_id: String,
557 path: String,
558 result: String,
559 hunks_count: usize,
560 bytes_written: u64,
561 #[serde(default, skip_serializing_if = "Option::is_none")]
562 failed_hunk_index: Option<usize>,
563 },
564 /// ACP control-plane arbitration outcome. Emitted for accepted,
565 /// idempotent, and rejected controls so replay/audit consumers can show
566 /// who acted and why a late or unauthorized action lost.
567 ControlOutcome {
568 session_id: String,
569 control_id: String,
570 method: String,
571 outcome: String,
572 status: String,
573 actor: serde_json::Value,
574 target: serde_json::Value,
575 #[serde(default, skip_serializing_if = "Option::is_none")]
576 reason: Option<String>,
577 #[serde(default, skip_serializing_if = "serde_json::Value::is_null")]
578 metadata: serde_json::Value,
579 },
580 /// Lifecycle update for a delegated/background worker. Carries the
581 /// canonical typed `event` variant alongside the worker's current
582 /// `status` string and the structured `metadata` payload that
583 /// `worker_bridge_metadata` builds (task, mode, timing, child
584 /// run/snapshot paths, audit-session, etc.). The `audit` field is
585 /// the same `MutationSessionRecord` JSON serialization carried on
586 /// the bridge wire so ACP/A2A consumers don't need to re-derive it.
587 ///
588 /// One-to-one with the bridge-side `worker_update` session-update
589 /// notification: ACP and A2A adapters subscribe to this variant
590 /// and translate it into their respective wire formats. The
591 /// `session_id` is the parent agent session that owns the worker
592 /// (i.e. the session whose VM spawned the worker), so a single
593 /// host stays subscribed to the same sink for both message and
594 /// worker traffic.
595 WorkerUpdate {
596 session_id: String,
597 worker_id: String,
598 worker_name: String,
599 worker_task: String,
600 worker_mode: String,
601 event: WorkerEvent,
602 status: String,
603 metadata: serde_json::Value,
604 audit: Option<serde_json::Value>,
605 },
606 /// A human-in-the-loop primitive (`ask_user`, `request_approval`,
607 /// `dual_control`, `escalate`) has just suspended the script and is
608 /// waiting on a response. Hosts that bridge the VM onto a remote
609 /// transport (ACP, A2A) translate this into a "paused / awaiting
610 /// input" wire signal so the client knows the task isn't stuck —
611 /// it's blocked on the human side. Pair-emitted with `HitlResolved`
612 /// when the waitpoint completes/cancels/times out.
613 HitlRequested {
614 session_id: String,
615 request_id: String,
616 kind: String,
617 payload: serde_json::Value,
618 },
619 /// Companion to `HitlRequested`: the waitpoint has resolved (either
620 /// a response arrived, the deadline elapsed, or the request was
621 /// cancelled). `outcome` is one of `"answered"`, `"timeout"`,
622 /// `"cancelled"`. Hosts use this to flip task state back to
623 /// `working` after an `input-required` pause.
624 HitlResolved {
625 session_id: String,
626 request_id: String,
627 kind: String,
628 outcome: String,
629 },
630 /// Emitted by the agent loop's adaptive iteration budget /
631 /// `loop_control` policy when a budget extension or early stop fires.
632 /// Generic enough to cover both shapes — `action` distinguishes them.
633 /// Carries the iteration the decision applied to, the previous /
634 /// resulting iteration limit, the policy reason string, and (for
635 /// stops) the loop status.
636 LoopControlDecision {
637 session_id: String,
638 iteration: usize,
639 action: String,
640 old_limit: usize,
641 new_limit: usize,
642 reason: String,
643 status: String,
644 },
645 /// Emitted when `agent_loop` detects adjacent repeated tool calls with
646 /// identical arguments. The warning payload avoids raw arguments by
647 /// default and carries digests so hosts can correlate repeats without
648 /// exposing potentially sensitive tool inputs.
649 AgentLoopStallWarning {
650 session_id: String,
651 warning: serde_json::Value,
652 },
653 /// Emitted when a concrete provider/model pair lacks a catalog
654 /// recommendation for a capability and the runtime chooses a fallback.
655 CapabilityGap {
656 session_id: String,
657 level: String,
658 capability: String,
659 provider: String,
660 model: String,
661 fallback_tool_format: String,
662 #[serde(default, skip_serializing_if = "Option::is_none")]
663 requested_tool_format: Option<String>,
664 message: String,
665 },
666 /// Emitted when a caller explicitly forces a tool format that
667 /// differs from the capability catalog's recommendation or known
668 /// native/text parity guidance.
669 ToolFormatOverride {
670 session_id: String,
671 provider: String,
672 model: String,
673 requested_format: String,
674 recommended_format: String,
675 catalog_parity: String,
676 #[serde(default, skip_serializing_if = "Option::is_none")]
677 override_reason: Option<String>,
678 },
679 /// Emitted when a `tool_caller` middleware (see std/llm/tool_middleware)
680 /// attaches structured audit metadata to a tool call — typically a
681 /// user-facing `summary`, a `description`, an ACP-style `kind`, an MCP
682 /// `hints` block, a `consent` decision, the per-layer `layers` log, or
683 /// free-form `metadata` keys (A2A-style extension slot).
684 ///
685 /// One-to-one with the underlying tool-call: hosts can join on
686 /// `tool_call_id` to render middleware-attached chips alongside the
687 /// existing `ToolCall` / `ToolCallUpdate` stream. The `audit` payload
688 /// is intentionally free-form JSON so middleware can carry whatever
689 /// shape the harness author chooses without needing protocol-level
690 /// changes per new middleware. When present, `receipt` carries the
691 /// stable typed, privacy-preserving record hosts can persist or mirror.
692 ToolCallAudit {
693 session_id: String,
694 tool_call_id: String,
695 tool_name: String,
696 audit: serde_json::Value,
697 #[serde(default, skip_serializing_if = "Option::is_none")]
698 receipt: Option<ToolCallReceipt>,
699 },
700 /// Emitted by `std/cache::with_cache` (both the generic and LLM
701 /// forms) when a cached lookup returns a hit. Carries the
702 /// content-addressed key, the backend that served the value, and a
703 /// `metrics` block with the cost-moat receipts the persona value
704 /// ledger (a cloud platform) and crystallization receipts read:
705 /// `model_calls_avoided`, plus `tokens_saved` / `latency_saved_ms`
706 /// when the cached envelope carried `usage` / `latency_ms`.
707 CacheHit {
708 session_id: String,
709 key: String,
710 backend: String,
711 namespace: String,
712 payload: serde_json::Value,
713 },
714 /// Paired with `CacheHit`. Emitted on the miss path when the
715 /// fresh result is stored. `payload.metrics.compute_ms` carries
716 /// the wall-clock cost of the underlying computation, which
717 /// callers can feed back as `estimate.latency_saved_ms` on the
718 /// next hit.
719 CacheMiss {
720 session_id: String,
721 key: String,
722 backend: String,
723 namespace: String,
724 payload: serde_json::Value,
725 },
726 /// A language-neutral tool-composition snippet has started. The envelope
727 /// identifies the snippet and binding manifest hashes plus the side-effect
728 /// ceiling requested for the whole parent run.
729 CompositionStart {
730 session_id: String,
731 run: CompositionRunEnvelope,
732 },
733 /// A composition snippet is dispatching a child binding call. The child
734 /// remains visible as its own operation with annotations and policy context
735 /// instead of being hidden inside the parent composition blob.
736 CompositionChildCall {
737 session_id: String,
738 call: CompositionChildCall,
739 },
740 /// A child binding operation emitted a status/result update.
741 CompositionChildResult {
742 session_id: String,
743 result: CompositionChildResult,
744 },
745 /// A composition run finished successfully and carries stdout/stderr,
746 /// artifacts, and the structured result in the terminal envelope.
747 CompositionFinish {
748 session_id: String,
749 run: CompositionRunEnvelope,
750 },
751 /// A composition run failed before producing a successful terminal result.
752 /// The terminal envelope carries the failure category and optional error.
753 CompositionError {
754 session_id: String,
755 run: CompositionRunEnvelope,
756 },
757 /// Emitted once per `__agent_loop_checkpoint(...)` pass. The single
758 /// named seam through which the agent loop drains queued bridge
759 /// injections and inbox feedback. Hosts use it to debug "did the
760 /// loop check for steering at the expected boundary" without having
761 /// to grep the loop body for inline drain calls.
762 ///
763 /// `kind` is one of the documented seam names: `iteration_start`,
764 /// `pre_tool_dispatch`, `post_tool_dispatch`, `iteration_end`,
765 /// `pre_compact`, `post_compact`, `daemon_idle_pre`,
766 /// `daemon_idle_post`, `loop_exit`. `delivered` is the count of
767 /// bridge injections drained at this seam (inbox drains are
768 /// reported separately under `inbox_delivered`). `dispatch_skipped`
769 /// is true only when an `interrupt_immediate` injection arrived at
770 /// `pre_tool_dispatch` and the pending tool batch was skipped.
771 LoopCheckpoint {
772 session_id: String,
773 iteration: usize,
774 kind: String,
775 delivered: usize,
776 #[serde(default, skip_serializing_if = "is_zero_usize")]
777 inbox_delivered: usize,
778 #[serde(default, skip_serializing_if = "std::ops::Not::not")]
779 dispatch_skipped: bool,
780 },
781 /// Surfaced when Harn is acting as an MCP **client** and a peer
782 /// server sends a server-to-client message during an agent session:
783 /// a `notifications/progress` / `notifications/message` /
784 /// `notifications/*/list_changed` notification, or an inbound
785 /// `elicitation/create` / `sampling/createMessage` request.
786 ///
787 /// Emitted alongside (not in place of) the existing agent-inbox
788 /// relay so a thin ACP client can render a live progress bar, log
789 /// line, elicitation prompt, or sampling affordance without parsing
790 /// the inbox transcript. `direction` is `"notification"` for
791 /// fire-and-forget server notifications and `"request"` for inbound
792 /// requests that still resolve through the existing client-role
793 /// dispatch path (this event does not change that response). `method`
794 /// is the raw MCP JSON-RPC method; `params` is its untouched payload.
795 McpNotification {
796 session_id: String,
797 server: String,
798 method: String,
799 direction: String,
800 params: serde_json::Value,
801 },
802 /// Surfaced when the effective MCP catalog changes — either because a
803 /// server emitted a `notifications/tools/list_changed` (or the
804 /// resource/prompt equivalents), or because the persisted enable/disable
805 /// allowlist was edited. A thin ACP client (an IDE host's TUI / GUI)
806 /// treats this as a cue to re-fetch the catalog (e.g. via the
807 /// `mcp/catalog` request) and re-render its toggle UI, rather than
808 /// reconciling any local state. `server` is the server whose list
809 /// changed, or `None` when the change is allowlist-wide. `reason` is a
810 /// short tag (`"list_changed"` or `"allowlist_updated"`).
811 McpCatalogChanged {
812 session_id: String,
813 #[serde(default, skip_serializing_if = "Option::is_none")]
814 server: Option<String>,
815 reason: String,
816 },
817 /// Surfaced when an MCP server harn is acting as a client for answers a
818 /// request with `401 Unauthorized` mid-session, meaning its OAuth token is
819 /// missing or expired. This is a cue for a thin ACP client (an IDE host's
820 /// TUI / GUI) to start an authorization: call `mcp/authorize` to mint a
821 /// browser URL, open it, and forward the redirect's `code`+`state` back via
822 /// `mcp/oauth_callback`. Token exchange and storage stay in harn. `server`
823 /// is the configured server name; `resource` is its canonical RFC 8707
824 /// resource indicator; `scope` is the `scope` parameter from the
825 /// `WWW-Authenticate` challenge, when present.
826 McpAuthRequired {
827 session_id: String,
828 server: String,
829 resource: String,
830 #[serde(default, skip_serializing_if = "Option::is_none")]
831 scope: Option<String>,
832 },
833}
834
835fn is_zero_usize(value: &usize) -> bool {
836 *value == 0
837}
838
839impl AgentEvent {
840 pub fn session_id(&self) -> &str {
841 match self {
842 Self::AgentMessageChunk { session_id, .. }
843 | Self::AgentThoughtChunk { session_id, .. }
844 | Self::UserMessage { session_id, .. }
845 | Self::ToolCall { session_id, .. }
846 | Self::ToolCallUpdate { session_id, .. }
847 | Self::Plan { session_id, .. }
848 | Self::ProgressReported { session_id, .. }
849 | Self::CompassRoutingDecision { session_id, .. }
850 | Self::AgentScratchpadReorganization { session_id, .. }
851 | Self::Artifact { session_id, .. }
852 | Self::IterationStart { session_id, .. }
853 | Self::IterationEnd { session_id, .. }
854 | Self::SessionClosed { session_id, .. }
855 | Self::AnchorChanged { session_id, .. }
856 | Self::JudgeDecision { session_id, .. }
857 | Self::StepJudgeDecision { session_id, .. }
858 | Self::StructuralValidatorDecision { session_id, .. }
859 | Self::ScopeClassifierVerdict { session_id, .. }
860 | Self::MissingToolCallVerdict { session_id, .. }
861 | Self::TypedCheckpoint { session_id, .. }
862 | Self::FeedbackInjected { session_id, .. }
863 | Self::BudgetExhausted { session_id, .. }
864 | Self::BudgetCircuitBreaker { session_id, .. }
865 | Self::LoopStuck { session_id, .. }
866 | Self::LoopStuckSignal { session_id, .. }
867 | Self::ReservedTerminalVerify { session_id, .. }
868 | Self::DaemonWatchdogTripped { session_id, .. }
869 | Self::SkillActivated { session_id, .. }
870 | Self::SkillDeactivated { session_id, .. }
871 | Self::SkillScopeTools { session_id, .. }
872 | Self::SkillNarrow { session_id, .. }
873 | Self::StanceTransition { session_id, .. }
874 | Self::ToolSearchQuery { session_id, .. }
875 | Self::ToolSearchResult { session_id, .. }
876 | Self::TranscriptCompacted { session_id, .. }
877 | Self::TranscriptProjected { session_id, .. }
878 | Self::ReminderEmitted { session_id, .. }
879 | Self::Handoff { session_id, .. }
880 | Self::FsWatch { session_id, .. }
881 | Self::StagedWritesPending { session_id, .. }
882 | Self::SafeTextPatchResult { session_id, .. }
883 | Self::ControlOutcome { session_id, .. }
884 | Self::WorkerUpdate { session_id, .. }
885 | Self::HitlRequested { session_id, .. }
886 | Self::HitlResolved { session_id, .. }
887 | Self::LoopControlDecision { session_id, .. }
888 | Self::AgentLoopStallWarning { session_id, .. }
889 | Self::CapabilityGap { session_id, .. }
890 | Self::ToolFormatOverride { session_id, .. }
891 | Self::ToolCallAudit { session_id, .. }
892 | Self::CacheHit { session_id, .. }
893 | Self::CacheMiss { session_id, .. }
894 | Self::CompositionStart { session_id, .. }
895 | Self::CompositionChildCall { session_id, .. }
896 | Self::CompositionChildResult { session_id, .. }
897 | Self::CompositionFinish { session_id, .. }
898 | Self::CompositionError { session_id, .. }
899 | Self::LoopCheckpoint { session_id, .. }
900 | Self::McpNotification { session_id, .. }
901 | Self::McpCatalogChanged { session_id, .. }
902 | Self::McpAuthRequired { session_id, .. } => session_id,
903 }
904 }
905}