aristo-cli 0.2.3

Aristo CLI binary (the `aristo` command).
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
//! `aristo nudge` — the nudge/progress engine's union function + surfaces
//! (Phase 18 #9, S0d). With no `--event` it prints what the engine would
//! surface (human introspection); with `--event <post-tool-use|
//! user-prompt-submit|session-start>` it runs as a Claude Code hook emitter
//! and ALWAYS exits 0 (a nudge must never break the agent).
//!
//! **Surface contract (v2, validated by the S0a spike — corrects SPINE-PLAN
//! D10).** A hook only reaches the agent's context via
//! `hookSpecificOutput.additionalContext` JSON — a plain `<system-reminder>`
//! to stdout lands in the transcript but NOT in the model's context (proven:
//! the old Stop/PostToolUse plain-stdout reminders never reached the agent;
//! the SessionStart additionalContext did). And `Stop` does not deliver at
//! all. So every surface here emits `additionalContext`, and the per-turn
//! human nudge rides `UserPromptSubmit` (fires at the start of every turn,
//! incl. the first — reliably reaches the agent without forcing continuation).
//! `Stop` is dropped (an old `--event stop` parses as unknown → silent).
//! `SessionStart` is compute-only: it captures the edit-window baseline and
//! resets the counter, surfacing nothing (the next `UserPromptSubmit` carries
//! the backlog). The ambient user-facing surface is `aristo statusline`.
//!
//! The union function [`build_inputs`] is the COMPUTE join the scorer reads:
//! the index-derived [`Metrics`] plus the runtime facts only the cli can see
//! (reviewed map, proof-reviewed map, edit-window baseline, sign-in). It is
//! read-only and never fails the caller on missing pieces — a nudge surface
//! must degrade quietly, never break a workflow.

use std::io::Read;

use aristo_core::config::{Aggressiveness, ConfigFile};
use aristo_core::metrics::Metrics;
use aristo_core::walk::{count_fns_per_module_with, WalkOptions};

use crate::commands::index::workspace_or_error;
use crate::commands::show::read_index;
use crate::nudge::state::{Baseline, NudgeState, STATE_FILENAME};
use crate::nudge::{score, throttle, Audience, Decision, EngineInputs};
use crate::{CliError, CliResult, Workspace};

/// Which Claude Code hook event this invocation is serving (or `None` for the
/// human introspection readout).
#[derive(Debug, Clone, Copy, PartialEq, Eq)]
enum HookEvent {
    PostToolUse,
    UserPromptSubmit,
    SessionStart,
}

fn parse_event(raw: &str) -> Option<HookEvent> {
    match raw {
        "post-tool-use" | "PostToolUse" => Some(HookEvent::PostToolUse),
        "user-prompt-submit" | "UserPromptSubmit" => Some(HookEvent::UserPromptSubmit),
        "session-start" | "SessionStart" => Some(HookEvent::SessionStart),
        // `stop`/`Stop` deliberately unhandled → silent: a Stop hook's stdout
        // never reaches the agent, so the per-turn nudge moved to
        // UserPromptSubmit. An already-installed `--event stop` no-ops here.
        _ => None,
    }
}

pub(crate) fn run(event: Option<String>) -> CliResult<()> {
    let ws = workspace_or_error()?;
    let config = ws.load_config();
    let aggressiveness = config.nudges.aggressiveness;

    // No --event → human introspection readout (the only mode that prints to
    // a human and may surface an error).
    let Some(raw) = event else {
        let state = NudgeState::load(&ws.aristo_dir().join(STATE_FILENAME));
        let inputs = build_inputs(&ws, &config, &state)?;
        let decision = score(&inputs, aggressiveness);
        print_readout(&inputs, aggressiveness, &decision);
        return Ok(());
    };

    // Hook mode: a nudge hook must NEVER break the agent. Swallow every error
    // and exit 0 — the worst case is "no nudge this turn".
    let _ = emit_for_event(&ws, &config, aggressiveness, &raw);
    Ok(())
}

fn emit_for_event(
    ws: &Workspace,
    config: &ConfigFile,
    aggressiveness: Aggressiveness,
    raw_event: &str,
) -> CliResult<()> {
    let Some(event) = parse_event(raw_event) else {
        return Ok(()); // unknown event → silent
    };
    let state_path = ws.aristo_dir().join(STATE_FILENAME);
    let mut state = NudgeState::load(&state_path);
    let now = now_epoch();

    match event {
        HookEvent::PostToolUse => {
            // Count edit-like tool calls toward the authoring-debt signal.
            if stdin_tool_is_edit() {
                state.edits_since_annotation = state.edits_since_annotation.saturating_add(1);
                let _ = state.save(&state_path);
            }
            if aggressiveness.is_off() {
                return Ok(());
            }
            // authoring_debt scores off the counter alone — NO build_inputs /
            // source walk (this hook fires on every edit; it must stay cheap).
            // Agent surface via additionalContext (the only channel that
            // reaches the agent); throttled so it doesn't nag once over the
            // threshold.
            let edits = state.edits_since_annotation;
            if let Some(f) = crate::nudge::score_authoring_debt(edits, aggressiveness) {
                if throttle::may_surface(
                    state.throttle.get(f.id),
                    now,
                    aggressiveness,
                    f.metric,
                    f.base,
                ) {
                    print_additional_context("PostToolUse", &authoring_debt_context(edits));
                    state.throttle.insert(
                        f.id.to_string(),
                        throttle::record_after_surface(now, f.metric),
                    );
                    let _ = state.save(&state_path);
                }
            }
        }
        HookEvent::UserPromptSubmit => {
            // The consolidated human nudge — at the START of each turn (incl.
            // the first), reaching the agent via additionalContext without
            // forcing continuation. Surface if ANY fired human signal clears
            // its throttle; the cooldown gates per-turn spam.
            if aggressiveness.is_off() {
                return Ok(());
            }
            let inputs = build_inputs(ws, config, &state)?;
            let decision = score(&inputs, aggressiveness);
            let cleared: Vec<crate::nudge::Fired> = decision
                .human
                .iter()
                .filter(|f| {
                    throttle::may_surface(
                        state.throttle.get(f.id),
                        now,
                        aggressiveness,
                        f.metric,
                        f.base,
                    )
                })
                .cloned()
                .collect();
            if !cleared.is_empty() {
                print_additional_context(
                    "UserPromptSubmit",
                    &review_nudge_context(&decision, &inputs),
                );
                for f in &cleared {
                    state.throttle.insert(
                        f.id.to_string(),
                        throttle::record_after_surface(now, f.metric),
                    );
                }
                let _ = state.save(&state_path);
            }
        }
        HookEvent::SessionStart => {
            // Compute-only: capture the edit-window baseline + reset the edit
            // counter. Surface NOTHING — the next UserPromptSubmit carries the
            // backlog (SessionStart surfacing is premature + once-only).
            let inputs = build_inputs(ws, config, &state)?;
            state.baseline = Some(Baseline {
                score: inputs.metrics.visible_score,
                tier: inputs.metrics.tier.label().to_string(),
            });
            // Snapshot the authored-intent id-set so #7 can split the review
            // backlog into new-this-session vs carried-over. Best-effort: if
            // the index can't be read, leave the window uncaptured (the split
            // is then suppressed, not guessed).
            state.window_intent_ids = read_index(&ws.index_path()).ok().map(|idx| {
                crate::nudge::intents::authored_intents(&idx)
                    .into_iter()
                    .map(|i| i.id)
                    .collect()
            });
            state.edits_since_annotation = 0;
            let _ = state.save(&state_path);
        }
    }
    Ok(())
}

fn now_epoch() -> u64 {
    time::OffsetDateTime::now_utc().unix_timestamp().max(0) as u64
}

/// Read the PostToolUse hook payload from stdin and decide whether the tool
/// was an edit-like (source-mutating) call. Tolerant: any parse failure or
/// absent stdin counts as "not an edit" (don't bump on uncertainty).
fn stdin_tool_is_edit() -> bool {
    let mut buf = String::new();
    if std::io::stdin().read_to_string(&mut buf).is_err() || buf.trim().is_empty() {
        return false;
    }
    let Ok(json) = serde_json::from_str::<serde_json::Value>(&buf) else {
        return false;
    };
    let tool = json.get("tool_name").and_then(|v| v.as_str()).unwrap_or("");
    matches!(tool, "Edit" | "Write" | "MultiEdit" | "NotebookEdit")
}

#[aristo::intent(
    "The union function is read-only and tolerant: it never mutates the \
     workspace and never fails the caller on missing runtime state. Absent \
     reviewed/proof-reviewed maps make everything read as unreviewed, an \
     absent baseline disables the gain/slump signals, and an unreadable \
     proofs dir contributes zero — degrade quietly. A nudge surface that \
     errored or wrote files would turn an advisory into a workflow blocker, \
     violating the engine's nudge-only posture (D3).",
    verify = "neural",
    id = "nudge_union_is_read_only_and_tolerant"
)]
/// Join the index-derived metrics with the cli-resident runtime signals into
/// the [`EngineInputs`] the scorer consumes. Read-only; tolerant of missing
/// state (the engine simply sees more as unreviewed / no baseline).
pub(crate) fn build_inputs(
    ws: &Workspace,
    config: &ConfigFile,
    state: &NudgeState,
) -> CliResult<EngineInputs> {
    let index = read_index(&ws.index_path())?;

    // Coverage denominator for the tier formula (read-only walk, as in badge).
    let fn_counts =
        count_fns_per_module_with(&ws.root, &WalkOptions::none()).map_err(|e| CliError::Other {
            message: format!("failed to walk source for metrics coverage: {e}"),
            exit_code: 1,
        })?;
    let metrics = Metrics::from_index(&index, &fn_counts, config.verify.default_method);

    // Unreviewed authored intents: every index intent the reviewed map doesn't
    // currently vouch for (absent, unmarked, or hash-drifted). The same
    // `authored_intents` enumeration `aristo review` reads, so the engine and
    // the review surface can never report a different backlog.
    let intents = crate::nudge::intents::authored_intents(&index);
    let unreviewed_intents = state.unreviewed_count(
        intents
            .iter()
            .map(|i| (i.id.as_str(), i.text_hash.as_str(), i.body_hash.as_str())),
    );

    let proofs_awaiting_review = count_proofs_awaiting(ws, state);

    let (prior_score, tier_increased) = match &state.baseline {
        Some(b) => (
            Some(b.score),
            metrics.tier.label() != b.tier && metrics.visible_score > b.score,
        ),
        None => (None, false),
    };

    // Local-only sign-in check (env var / config files; never network).
    let signed_in = aristo_core::auth::resolve_full().is_ok();

    // Canon matching is paid (#10): only read the local cache + suggestions
    // queue when signed in, so the canon signal does no work and stays silent
    // otherwise (no upsell spam). The reader is tolerant — errors yield 0.
    let canon_pending = if signed_in {
        crate::commands::canon::suggestions::pending_total(ws)
    } else {
        0
    };

    Ok(EngineInputs {
        metrics,
        edits_since_annotation: state.edits_since_annotation,
        unreviewed_intents,
        proofs_awaiting_review,
        canon_pending,
        prior_score,
        tier_increased,
        signed_in,
    })
}

/// Count `.aristo/proofs/<id>.proof` files whose verdict the proof-reviewed
/// map doesn't yet vouch for. Absent dir → 0.
fn count_proofs_awaiting(ws: &Workspace, state: &NudgeState) -> usize {
    let dir = ws.aristo_dir().join("proofs");
    let Ok(read) = std::fs::read_dir(&dir) else {
        return 0;
    };
    let mut n = 0usize;
    for entry in read.flatten() {
        let path = entry.path();
        if path.extension().and_then(|e| e.to_str()) != Some("proof") {
            continue;
        }
        let Some(stem) = path.file_stem().and_then(|s| s.to_str()) else {
            continue;
        };
        let id = stem.replace("__", ":");
        if !state.proof_reviewed.get(&id).copied().unwrap_or(false) {
            n += 1;
        }
    }
    n
}

fn print_readout(
    inputs: &EngineInputs,
    aggressiveness: aristo_core::config::Aggressiveness,
    decision: &crate::nudge::Decision,
) {
    println!("Aristo nudge engine — would-surface readout");
    println!("  aggressiveness: {aggressiveness:?}");
    println!(
        "  inputs: {} unreviewed · {} unverified/{} verifiable · {} proofs awaiting · score {:.2} ({})",
        inputs.unreviewed_intents,
        inputs.metrics.unverified,
        inputs.metrics.verifiable,
        inputs.proofs_awaiting_review,
        inputs.metrics.visible_score,
        inputs.metrics.tier.label(),
    );
    if decision.is_silent() {
        println!("  → nothing would fire.");
        return;
    }
    if let Some(rec) = decision.recommended() {
        println!("  → recommended: {rec}");
    }
    for fired in &decision.human {
        println!("  · [human] {} (pressure {:.2})", fired.id, fired.pressure);
    }
    for fired in &decision.agent {
        let _ = Audience::Agent; // audiences are surfaced on different channels
        println!("  · [agent] {} (pressure {:.2})", fired.id, fired.pressure);
    }
}

// ─── hook emit: the agent's context is reached ONLY via additionalContext ──
// A hook only injects into the model's context through
// `hookSpecificOutput.additionalContext` (the S0a spike proved a plain
// `<system-reminder>` to stdout does not). The CLI nudges the AGENT; the agent
// is the one that talks to the human (pops the review skill / AskUserQuestion).

#[aristo::intent(
    "A hook reaches the agent's context ONLY through \
     `hookSpecificOutput.additionalContext`; a plain string (even a literal \
     `<system-reminder>`) printed to a hook's stdout lands in the transcript \
     but never in the model's context (the S0a spike: the old Stop/PostToolUse \
     stdout reminders never reached the agent, the SessionStart \
     additionalContext did). Every agent-facing nudge MUST use this JSON \
     envelope — emitting bare text would be a silently-dead nudge.",
    verify = "test",
    id = "nudge_reaches_agent_only_via_additional_context"
)]
/// The Claude Code hook `additionalContext` envelope for `event_name` — the
/// only channel that injects into the agent's context.
fn additional_context_json(event_name: &str, context: &str) -> serde_json::Value {
    serde_json::json!({
        "hookSpecificOutput": {
            "hookEventName": event_name,
            "additionalContext": context,
        }
    })
}

/// Emit the `additionalContext` envelope to stdout.
fn print_additional_context(event_name: &str, context: &str) {
    println!("{}", additional_context_json(event_name, context));
}

/// PostToolUse agent nudge body: prod the coding agent to capture intent.
fn authoring_debt_context(edits: usize) -> String {
    format!(
        "Aristo: {edits} source edits since your last annotation. If any of \
         them embodied a non-obvious decision (a chosen invariant, a refactor \
         trap, an intentional-not-incomplete choice), capture it now with an \
         `aristo::intent` while the rationale is fresh — see the \
         aristo-authoring skill. Skip if the edits were purely mechanical."
    )
}

/// UserPromptSubmit consolidated nudge body: a hook can't pop an
/// AskUserQuestion, so it nudges the AGENT to offer the user the recommended
/// review at a natural pause. Subject-only — about the user's own
/// annotations/verification.
fn review_nudge_context(decision: &Decision, inputs: &EngineInputs) -> String {
    let mut context = format!("Aristo progress nudge — {}.", backlog_summary(inputs));
    if let Some(rec) = decision.recommended() {
        context.push_str(&format!(
            " At a natural pause, offer the user: {}. Don't interrupt mid-task.",
            recommended_phrase(rec)
        ));
    }
    context
}

/// A subject-only one-line summary of the standing backlog.
fn backlog_summary(inputs: &EngineInputs) -> String {
    let mut parts = Vec::new();
    if inputs.unreviewed_intents > 0 {
        parts.push(format!(
            "{} intent(s) await review",
            inputs.unreviewed_intents
        ));
    }
    if inputs.canon_pending > 0 {
        parts.push(format!(
            "{} canon match(es)/suggestion(s) pending",
            inputs.canon_pending
        ));
    }
    if inputs.metrics.unverified > 0 {
        parts.push(format!(
            "{} of {} intents unverified",
            inputs.metrics.unverified, inputs.metrics.verifiable
        ));
    }
    if inputs.proofs_awaiting_review > 0 {
        parts.push(format!(
            "{} proof(s) await review",
            inputs.proofs_awaiting_review
        ));
    }
    if parts.is_empty() {
        format!(
            "tier {} (score {:.2})",
            inputs.metrics.tier.label(),
            inputs.metrics.visible_score
        )
    } else {
        parts.join(" · ")
    }
}

/// Map a signal id to the low-friction action the agent should offer.
fn recommended_phrase(signal_id: &str) -> &'static str {
    match signal_id {
        "congrats" => "a quick note on the progress just made (tier/score went up)",
        "review_backlog" => {
            "an intent review — Critique-first runs in the background while you continue"
        }
        "canon_pending" => "a look at the pending canon matches (aristo-intent-suggestions)",
        "verify_backlog" => "running `aristo verify` (can run in the background)",
        "proof_review_backlog" => "a review of the freshly-verified proofs",
        "score_slump" => "shoring up coverage — annotate or verify to recover the score",
        _ => "a review of the outstanding aristo items",
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn additional_context_envelope_carries_event_and_context() {
        let v = additional_context_json("UserPromptSubmit", "hello backlog");
        assert_eq!(v["hookSpecificOutput"]["hookEventName"], "UserPromptSubmit");
        assert_eq!(
            v["hookSpecificOutput"]["additionalContext"],
            "hello backlog"
        );
        // It is JSON (the only channel that injects), NOT a bare <system-reminder>.
        let s = v.to_string();
        assert!(s.contains("hookSpecificOutput"));
        assert!(!s.contains("<system-reminder>"));
    }

    #[test]
    fn parse_event_drops_stop_and_keeps_the_v2_events() {
        assert_eq!(parse_event("post-tool-use"), Some(HookEvent::PostToolUse));
        assert_eq!(
            parse_event("user-prompt-submit"),
            Some(HookEvent::UserPromptSubmit)
        );
        assert_eq!(parse_event("session-start"), Some(HookEvent::SessionStart));
        // Stop is dropped — an already-installed `--event stop` no-ops silently.
        assert_eq!(parse_event("stop"), None);
        assert_eq!(parse_event("Stop"), None);
        assert_eq!(parse_event("nonsense"), None);
    }

    #[test]
    fn authoring_debt_context_names_the_count_and_the_skill() {
        let c = authoring_debt_context(4);
        assert!(c.contains("4 source edits"));
        assert!(c.contains("aristo-authoring"));
    }
}