rsclaw-agent 0.1.0

//! L1 memory extractor (docs/memory-extraction-redesign.md, Phase 3).
//!
//! Phase 1 stopped raw-note pollution, but with only deterministic entity
//! extraction (phone/ID/email) it also dropped soft durable signal like
//! "我叫东升" or "我喜欢简洁的回答". This module adds an LLM distillation pass
//! over the user message (a trusted source) that classifies durable knowledge
//! into the fixed kind taxonomy and writes only the salient results.
//!
//! Runs spawned/async so the per-turn flash call never delays the reply, and
//! only on turns that pass the cheap [`salience_gate`] so most chit-chat / task
//! requests never trigger an LLM call. All failures are logged and swallowed —
//! extraction is best-effort and must never break the turn.

use std::sync::Arc;

use tokio::sync::Mutex;

use crate::memory::{MemDocTier, MemoryDoc, MemoryStore, add_off_lock};
use rsclaw_provider::registry::ProviderRegistry;
use rsclaw_skill::crystallizer::{acquire_distill_permit, distill_with_llm};

/// Max L1 items written per turn — guards against a runaway model dumping
/// dozens of "facts" from a single message. Used by `extract_l1`; the lesson
/// extractor has its own, smaller cap (`MAX_LESSON_ITEMS`).
const MAX_ITEMS_PER_TURN: usize = 6;
/// Confidence floor. The model scores each item 0..1; drop the unsure ones.
/// Shared by all three extractors in this module. Items whose confidence is
/// missing or malformed are parsed as 0.0, so they always fall below it.
const MIN_CONFIDENCE: f32 = 0.55;

/// Caps concurrent in-flight L1 extractions. A burst of "remember…" messages
/// would otherwise spawn unbounded tasks all queued on the distill permit,
/// each retaining its `user_text`. We `try_acquire` (never wait): over the cap,
/// L1 is skipped for that turn — best-effort by design, deterministic entity
/// capture is unaffected.
///
/// The same semaphore is also taken by `extract_lesson` and
/// `extract_failure_lesson`, so the limit of 4 applies to all three
/// extractors combined, not to each one separately.
static L1_INFLIGHT: tokio::sync::Semaphore = tokio::sync::Semaphore::const_new(4);

/// Deterministic, LLM-free filter deciding whether a user message is worth an
/// L1 extraction call.
///
/// The message is trimmed and must be between 4 and 4000 characters
/// (inclusive, counted in `char`s, not bytes). It passes when its lowercased
/// form contains at least one of the marker substrings below: first-person
/// self-description, stated preferences, family/organisation references, or an
/// explicit "remember this" request, in Chinese or English.
///
/// The list deliberately favours precision over recall: questions, greetings,
/// acknowledgements and most task requests match nothing and return `false`.
pub(crate) fn salience_gate(text: &str) -> bool {
    const MARKERS: &[&str] = &[
        // Chinese self-description / preference / relationship / imperative-remember.
        "我叫",
        "我是",
        "我的",
        "我家",
        "我住",
        "住在",
        "我用",
        "我习惯",
        "喜欢",
        "讨厌",
        "我想要",
        "我希望",
        "我们公司",
        "我老婆",
        "我妻子",
        "我太太",
        "我老公",
        "我儿子",
        "我女儿",
        "我爸",
        "我妈",
        "我生日",
        "记住",
        "记一下",
        "记下",
        "帮我记",
        "偏好",
        "以后每次",
        "每次都",
        // English.
        "my name",
        "my wife",
        "my husband",
        "i live",
        "i'm from",
        "i am ",
        "i'm ",
        "i like",
        "i prefer",
        "i hate",
        "i use ",
        "i work",
        "call me",
        "remember that",
        "remember to",
    ];

    let trimmed = text.trim();
    // Too short to carry durable signal, or too long to be worth a flash call.
    if !(4..=4000).contains(&trimmed.chars().count()) {
        return false;
    }

    // Lowercasing only affects the English markers; CJK text is unchanged.
    let haystack = trimmed.to_lowercase();
    for marker in MARKERS {
        if haystack.contains(*marker) {
            return true;
        }
    }
    false
}

/// Storage policy for every kind the extractors in this module may write:
/// `(tier, importance, pinned)`. Returns `None` for anything else, which the
/// callers treat as "drop the item". `note` is intentionally absent — these
/// extractors never produce it.
///
/// Mirrors §2/§3 of the redesign doc:
/// - `entity` (e.g. a name) is pinned Core.
/// - `preference` / `procedure` and `fact` / `project_state` / `relationship`
///   are unpinned Working, at two importance levels.
/// - `lesson` and `failure` are described inline below.
fn kind_policy(kind: &str) -> Option<(MemDocTier, f32, bool)> {
    let policy = match kind {
        "entity" => (MemDocTier::Core, 0.9, true),
        "preference" | "procedure" => (MemDocTier::Working, 0.72, false),
        "fact" | "project_state" | "relationship" => (MemDocTier::Working, 0.65, false),
        // Learned from a user correction: Core tier (slow decay) but NOT
        // pinned, so a later contradicting correction can supersede it
        // instead of both lingering forever.
        "lesson" => (MemDocTier::Core, 0.85, false),
        // Inferred from the assistant's OWN failure (a detected tool loop).
        // One stuck turn isn't proof an approach is permanently bad, so it
        // sits in Working tier and decays out if it was a one-off.
        "failure" => (MemDocTier::Working, 0.6, false),
        _ => return None,
    };
    Some(policy)
}

/// Max lesson items per correction — a single correction rarely teaches more
/// than one or two durable rules. Used by `extract_lesson` only.
const MAX_LESSON_ITEMS: usize = 2;

/// Deterministic, LLM-free filter for the lesson extractor: does the user
/// message look like a correction of the assistant, or a standing instruction
/// about how it should behave from now on?
///
/// The message is trimmed and must be between 2 and 4000 characters
/// (inclusive, counted in `char`s). It passes when its lowercased form
/// contains any of the marker substrings below (Chinese and English).
///
/// The markers are intentionally loose. The lesson prompt tells the model to
/// answer `[]` when there is no durable lesson, so a false positive here costs
/// one extra flash call rather than a bad memory.
pub(crate) fn correction_gate(text: &str) -> bool {
    const MARKERS: &[&str] = &[
        // Chinese correction / "do it this way from now on".
        "不对",
        "错了",
        "搞错",
        "弄错",
        "不是这",
        "不是我要",
        "我说的是",
        "应该是",
        "应该用",
        "别这样",
        "别用",
        "不要这样",
        "重新",
        "纠正",
        "下次",
        "以后不要",
        "以后别",
        "记住别",
        "不准",
        // English.
        "that's wrong",
        "thats wrong",
        "not what i",
        "not correct",
        "incorrect",
        "you should",
        "should have",
        "don't do",
        "do not do",
        "stop doing",
        "next time",
        "actually i meant",
        "i meant",
        "not like that",
        "redo",
        "you misunderstood",
    ];

    let trimmed = text.trim();
    // A two-character correction such as "不对" is valid, hence the lower bound of 2.
    if !(2..=4000).contains(&trimmed.chars().count()) {
        return false;
    }

    let haystack = trimmed.to_lowercase();
    for marker in MARKERS {
        if haystack.contains(*marker) {
            return true;
        }
    }
    false
}

/// Instruction prefix for the lesson extractor. `extract_lesson` appends the
/// raw user message directly after the trailing `User message:` line. The
/// model is asked to reply with a JSON array of
/// `{"kind":"lesson","text":…,"confidence":…}` objects, or `[]` when the
/// message carries no durable behavioral rule.
const LESSON_PROMPT: &str = "The user message below is reacting to the assistant. ONLY if it corrects a mistake the assistant made, or states a durable rule about how the assistant should behave or answer in future, capture that as a concise imperative lesson the assistant should follow next time. Ignore one-off task requests, questions, greetings, and venting that carry no reusable rule.\nOutput a JSON array; each element: {\"kind\":\"lesson\",\"text\":\"<concise imperative lesson, written about the assistant, preserving the user's language for specifics>\",\"confidence\":<number 0..1>}\nExamples of text: \"When the user asks for code, do not add explanatory comments unless asked\", \"回答用户时不要用表格，用要点列表\".\nIf there is no durable behavioral lesson, output an empty array []. Output ONLY JSON — no explanation, no code fences.\n\nUser message:\n";

/// Instruction prefix for the general L1 extractor. `extract_l1` appends the
/// raw user message directly after the trailing `User message:` line. The
/// model is asked to reply with a JSON array of
/// `{"kind":…,"text":…,"confidence":…}` objects restricted to the six listed
/// kinds, written in the user's own language, or `[]` when nothing is worth
/// keeping. The prompt also forbids inventing values that are not literally in
/// the message.
const EXTRACTION_PROMPT: &str = "Extract durable, long-term-worthy information from the user message below. Capture only stable, reusable knowledge: identity, contact details, preferences, stable facts, project state, relationships between people/orgs, and reusable procedures. Ignore greetings, questions, one-off task requests, and emotional venting.\nCRITICAL: Use ONLY facts the user explicitly states in THIS message. Never infer, complete, guess, or invent any value — in particular do NOT fabricate emails, phone numbers, IDs, names, addresses, or dates (e.g. never output a placeholder like test@example.com). If a detail is not literally present in the message, omit it entirely.\nOutput a JSON array; each element: {\"kind\":\"<kind>\",\"text\":\"<concise third-person statement>\",\"confidence\":<number 0..1>}\nkind must be exactly one of: entity, preference, fact, project_state, relationship, procedure.\nWrite text in the third person and self-contained. CRITICAL: the text MUST be in the SAME language as the user message — if the user wrote in Chinese, the text MUST be in Chinese; if English, English. Never translate. Translating breaks keyword recall.\nExamples — Chinese in, Chinese out: \"用户名叫东升\", \"用户偏好简洁直接的回答\", \"用户最喜欢的车是 tesla\", \"用户的发布流程：cargo test，然后检查 UI，然后 commit\". English in, English out: \"User's name is John\", \"User prefers concise answers\".\nEvery item must include a numeric confidence in [0,1]. If nothing is worth remembering long-term, output an empty array []. Output ONLY JSON — no explanation, no code fences.\n\nUser message:\n";

/// Decide whether a freshly extracted memory is already known.
///
/// Two checks run under a single store lock, in this order:
/// 1. exact text match within the same `(scope, kind)`;
/// 2. semantic near-duplicate within `scope`, using the configured
///    `meditation.dedup_threshold`. The `kind` is not passed to this lookup,
///    so it can match across kinds (Phase 4 — the deterministic-phone vs
///    L1-phone class of duplicate that an exact match never catches).
///
/// A semantic hit refreshes the existing doc via `refresh_as_duplicate`,
/// passing the new item's `importance`, instead of inserting a sibling.
/// A failed refresh is logged and still counts as a duplicate.
///
/// Returns `true` when the new item should be skipped, `false` when it is
/// novel and should be inserted.
async fn dedup_or_refresh(
    mem: &Arc<Mutex<MemoryStore>>,
    scope: &str,
    kind: &str,
    text: &str,
    importance: f32,
) -> bool {
    // Read the threshold before taking the store lock.
    let threshold = crate::evolution::evolution_config()
        .meditation
        .dedup_threshold;
    let mut store = mem.lock().await;

    if store.find_exact(scope, kind, text).is_some() {
        return true;
    }

    let Some((dup_id, sim)) = store.find_semantic_dup(scope, text, threshold) else {
        return false;
    };

    match store.refresh_as_duplicate(&dup_id, importance) {
        Ok(refreshed) => {
            if refreshed {
                tracing::debug!(%dup_id, sim, kind, "semantic dup — refreshed existing doc");
            }
        }
        Err(e) => tracing::warn!("semantic dup refresh failed: {e:#}"),
    }
    true
}

/// Spawn-friendly L1 extraction. Resolves the flash model, distills the user
/// message into structured candidates, and writes the salient ones.
///
/// Pipeline:
/// 1. Take an `L1_INFLIGHT` slot without waiting; skip the turn if none is free.
/// 2. Resolve the provider/model and wait for a distill permit.
/// 3. Send `EXTRACTION_PROMPT` + `user_text` to the model and parse the reply.
/// 4. Keep items with a known kind, confidence ≥ `MIN_CONFIDENCE` and at least
///    three characters of trimmed text; then cap at `MAX_ITEMS_PER_TURN`.
/// 5. Skip exact/semantic duplicates via `dedup_or_refresh`, insert the rest.
///
/// Validation runs BEFORE the cap, so malformed or low-confidence items at the
/// front of the model's reply cannot use up the budget and push valid items
/// out. The cap still bounds how many candidates reach the store.
///
/// Best-effort: every failure is logged and swallowed; nothing is returned.
pub(crate) async fn extract_l1(
    mem: Arc<Mutex<MemoryStore>>,
    providers: Arc<ProviderRegistry>,
    flash_model: String,
    scope: String,
    user_text: String,
) {
    // Bound in-flight L1 work. Over the cap we skip rather than queue, so a
    // burst of messages can't pile up tasks or retained text.
    let Ok(_inflight) = L1_INFLIGHT.try_acquire() else {
        tracing::debug!("L1 extract: at concurrency cap, skipping turn");
        return;
    };
    let (provider_name, model_id) = providers.resolve_model(&flash_model);
    let provider_arc = match providers.get(provider_name) {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!(
                provider = provider_name,
                "L1 extract: provider not registered: {e:#}"
            );
            return;
        }
    };
    let _permit = match acquire_distill_permit().await {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!("L1 extract: permit acquire failed: {e:#}");
            return;
        }
    };
    let prompt = format!("{EXTRACTION_PROMPT}{user_text}");
    let raw = match distill_with_llm(&prompt, provider_arc, model_id.to_owned()).await {
        Ok(s) => s,
        Err(e) => {
            tracing::warn!("L1 extract: LLM call failed: {e:#}");
            return;
        }
    };

    let items = parse_items(&raw);
    if items.is_empty() {
        tracing::debug!(scope = %scope, "L1 extract: nothing durable");
        return;
    }

    // Cheap synchronous validation first, cap second: only items that could
    // actually be written count against MAX_ITEMS_PER_TURN.
    let candidates = items
        .into_iter()
        .filter_map(|item| {
            let (tier, importance, pinned) = kind_policy(&item.kind)?;
            if item.confidence < MIN_CONFIDENCE {
                return None;
            }
            let text = item.text.trim().to_owned();
            (text.chars().count() >= 3).then_some((item.kind, text, tier, importance, pinned))
        })
        .take(MAX_ITEMS_PER_TURN);

    let mut written = 0usize;
    for (kind, text, tier, importance, pinned) in candidates {
        if dedup_or_refresh(&mem, &scope, &kind, &text, importance).await {
            continue;
        }
        // Pinned docs carry both the flag and a matching tag.
        let tags = if pinned {
            vec!["pinned".to_owned()]
        } else {
            vec![]
        };
        let doc = MemoryDoc {
            id: uuid::Uuid::new_v4().to_string(),
            scope: scope.clone(),
            kind: kind.clone(),
            text,
            vector: vec![],
            created_at: 0,
            accessed_at: 0,
            access_count: 0,
            importance,
            tier,
            abstract_text: None,
            overview_text: None,
            tags,
            pinned,
        };
        match add_off_lock(&mem, doc).await {
            Ok(_) => written += 1,
            Err(e) => tracing::warn!(kind = %kind, "L1 extract: add failed: {e:#}"),
        }
    }
    if written > 0 {
        tracing::info!(scope = %scope, written, "L1 memories extracted");
    }
}

/// Spawn-friendly lesson extraction from a user correction. Mirrors
/// [`extract_l1`] but uses the correction-focused prompt and writes only
/// `kind=lesson` items (Core tier, supersedable). Gated upstream by
/// [`correction_gate`]; best-effort, all failures logged and swallowed.
///
/// Source is the USER message only — never the assistant's own output — so we
/// don't crystallize the model's possibly-confabulated account of what it did
/// (the same trust boundary the per-turn entity/L1 paths respect).
///
/// Items are validated (kind is `lesson`, confidence ≥ `MIN_CONFIDENCE`, at
/// least three characters of trimmed text) BEFORE the `MAX_LESSON_ITEMS` cap
/// is applied, so stray non-lesson or low-confidence items at the front of
/// the model's reply cannot crowd out a valid lesson.
pub(crate) async fn extract_lesson(
    mem: Arc<Mutex<MemoryStore>>,
    providers: Arc<ProviderRegistry>,
    flash_model: String,
    scope: String,
    user_text: String,
) {
    // Shares the L1 in-flight cap: lesson + L1 distills are both flash calls
    // and shouldn't pile up together.
    let Ok(_inflight) = L1_INFLIGHT.try_acquire() else {
        tracing::debug!("lesson extract: at concurrency cap, skipping turn");
        return;
    };
    let (provider_name, model_id) = providers.resolve_model(&flash_model);
    let provider_arc = match providers.get(provider_name) {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!(
                provider = provider_name,
                "lesson extract: provider not registered: {e:#}"
            );
            return;
        }
    };
    let _permit = match acquire_distill_permit().await {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!("lesson extract: permit acquire failed: {e:#}");
            return;
        }
    };
    let prompt = format!("{LESSON_PROMPT}{user_text}");
    let raw = match distill_with_llm(&prompt, provider_arc, model_id.to_owned()).await {
        Ok(s) => s,
        Err(e) => {
            tracing::warn!("lesson extract: LLM call failed: {e:#}");
            return;
        }
    };

    let items = parse_items(&raw);
    if items.is_empty() {
        tracing::debug!(scope = %scope, "lesson extract: no durable lesson");
        return;
    }

    // Only accept lesson items; ignore anything else the model emits. Filter
    // first and cap second so rejected items don't consume the budget.
    let lessons = items
        .into_iter()
        .filter(|item| item.kind == "lesson" && item.confidence >= MIN_CONFIDENCE)
        .filter_map(|item| {
            let text = item.text.trim().to_owned();
            (text.chars().count() >= 3).then_some(text)
        })
        .take(MAX_LESSON_ITEMS);

    let mut written = 0usize;
    for text in lessons {
        let Some((tier, importance, pinned)) = kind_policy("lesson") else {
            continue;
        };
        if dedup_or_refresh(&mem, &scope, "lesson", &text, importance).await {
            continue;
        }
        let doc = MemoryDoc {
            id: uuid::Uuid::new_v4().to_string(),
            scope: scope.clone(),
            kind: "lesson".to_owned(),
            text,
            vector: vec![],
            created_at: 0,
            accessed_at: 0,
            access_count: 0,
            importance,
            tier,
            abstract_text: None,
            overview_text: None,
            tags: vec![],
            pinned,
        };
        match add_off_lock(&mem, doc).await {
            Ok(_) => written += 1,
            Err(e) => tracing::warn!("lesson extract: add failed: {e:#}"),
        }
    }
    if written > 0 {
        tracing::info!(scope = %scope, written, "lesson memories extracted");
    }
}

/// Spawn-friendly failure-lesson extraction. Triggered when the agent loop
/// detected the assistant repeating a tool call without progress. Distills a
/// generalizable lesson from the user's TASK (trusted) plus a FACTUAL trace of
/// the looping tool call (the harness recorded what was actually invoked — this
/// is ground truth, not the assistant's prose account, so it stays on the right
/// side of the don't-crystallize-agent-output boundary).
///
/// Writes at most one `kind=failure` doc (Working tier, decays): the first
/// item in the model's reply that has kind `failure`, confidence ≥
/// `MIN_CONFIDENCE` and at least three characters of trimmed text. Invalid
/// items ahead of it are skipped rather than ending the search.
///
/// Best-effort; failures logged and swallowed.
pub(crate) async fn extract_failure_lesson(
    mem: Arc<Mutex<MemoryStore>>,
    providers: Arc<ProviderRegistry>,
    flash_model: String,
    scope: String,
    task_text: String,
    failure_trace: String,
) {
    // Shares the in-flight cap with the other extractors; never waits.
    let Ok(_inflight) = L1_INFLIGHT.try_acquire() else {
        tracing::debug!("failure extract: at concurrency cap, skipping turn");
        return;
    };
    let (provider_name, model_id) = providers.resolve_model(&flash_model);
    let provider_arc = match providers.get(provider_name) {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!(
                provider = provider_name,
                "failure extract: provider not registered: {e:#}"
            );
            return;
        }
    };
    let _permit = match acquire_distill_permit().await {
        Ok(p) => p,
        Err(e) => {
            tracing::warn!("failure extract: permit acquire failed: {e:#}");
            return;
        }
    };
    let prompt = format!(
        "The assistant got stuck repeating a tool call while handling the user's task and made no progress (a loop was detected). From the user's task and the factual trace of the repeated tool call below, extract a durable, GENERALIZABLE lesson — an approach that doesn't work for this kind of task and what to try instead. Do NOT just restate the error. If there is no generalizable lesson (e.g. a one-off transient glitch), output an empty array [].\nOutput a JSON array; each element: {{\"kind\":\"failure\",\"text\":\"<concise imperative lesson for next time>\",\"confidence\":<number 0..1>}}\nOutput ONLY JSON — no explanation, no code fences.\n\nUser task:\n{task_text}\n\nRepeated tool call (factual trace):\n{failure_trace}\n"
    );
    let raw = match distill_with_llm(&prompt, provider_arc, model_id.to_owned()).await {
        Ok(s) => s,
        Err(e) => {
            tracing::warn!("failure extract: LLM call failed: {e:#}");
            return;
        }
    };

    // At most one failure lesson per stuck turn: take the first VALID item
    // rather than giving up when the first element happens to be junk.
    let candidate = parse_items(&raw).into_iter().find(|item| {
        item.kind == "failure"
            && item.confidence >= MIN_CONFIDENCE
            && item.text.trim().chars().count() >= 3
    });
    let Some(item) = candidate else {
        return;
    };
    let text = item.text.trim().to_owned();

    let Some((tier, importance, pinned)) = kind_policy("failure") else {
        return;
    };
    if dedup_or_refresh(&mem, &scope, "failure", &text, importance).await {
        return;
    }
    let doc = MemoryDoc {
        id: uuid::Uuid::new_v4().to_string(),
        scope: scope.clone(),
        kind: "failure".to_owned(),
        text,
        vector: vec![],
        created_at: 0,
        accessed_at: 0,
        access_count: 0,
        importance,
        tier,
        abstract_text: None,
        overview_text: None,
        tags: vec![],
        pinned,
    };
    match add_off_lock(&mem, doc).await {
        Ok(_) => tracing::info!(scope = %scope, "failure lesson extracted"),
        Err(e) => tracing::warn!("failure extract: add failed: {e:#}"),
    }
}

/// One candidate memory parsed from the model's JSON reply, before any policy
/// or confidence filtering has been applied.
#[derive(Debug, Clone, PartialEq)]
struct Item {
    /// Kind label exactly as the model emitted it; never empty, but not yet
    /// checked against the allowed kinds.
    kind: String,
    /// Statement text as emitted (untrimmed); never empty.
    text: String,
    /// Model-reported confidence in `[0, 1]`; `0.0` when the field was
    /// missing, non-numeric or out of range.
    confidence: f32,
}

/// Turn a raw model completion into candidate items.
///
/// The completion is first reduced to its JSON payload by `strip_fences`. Two
/// shapes are accepted:
/// - a single JSON value (normally an array of objects);
/// - JSON Lines — one object per line, with an optional trailing comma.
///
/// The line-by-line fallback runs only when the whole-payload parse yields no
/// items. Anything that doesn't parse is skipped; this function never fails.
fn parse_items(raw: &str) -> Vec<Item> {
    let payload = strip_fences(raw);
    let mut items = Vec::new();

    // Preferred shape: the whole payload is one JSON value.
    if let Ok(value) = serde_json::from_str::<serde_json::Value>(&payload) {
        collect_value(&value, &mut items);
    }
    if !items.is_empty() {
        return items;
    }

    // Fallback: treat every non-empty line as its own JSON value.
    payload
        .lines()
        .map(|line| line.trim().trim_end_matches(','))
        .filter(|line| !line.is_empty())
        .filter_map(|line| serde_json::from_str::<serde_json::Value>(line).ok())
        .for_each(|value| collect_value(&value, &mut items));
    items
}

fn collect_value(v: &serde_json::Value, out: &mut Vec<Item>) {
    match v {
        serde_json::Value::Array(arr) => {
            for el in arr {
                collect_value(el, out);
            }
        }
        serde_json::Value::Object(obj) => {
            let kind = obj
                .get("kind")
                .and_then(|x| x.as_str())
                .unwrap_or("")
                .to_owned();
            let text = obj
                .get("text")
                .and_then(|x| x.as_str())
                .unwrap_or("")
                .to_owned();
            // Require a real numeric confidence in [0,1]. Missing/garbage
            // confidence → 0.0, which fails MIN_CONFIDENCE and is dropped, so
            // adversarial output can't slip in unscored items.
            let confidence = match obj.get("confidence").and_then(|x| x.as_f64()) {
                Some(c) if c.is_finite() && (0.0..=1.0).contains(&c) => c as f32,
                _ => 0.0,
            };
            if !kind.is_empty() && !text.is_empty() {
                out.push(Item {
                    kind,
                    text,
                    confidence,
                });
            }
        }
        _ => {}
    }
}

/// Clean a model completion down to its JSON payload. The agent model
/// (rsclaw-agent-v1) is a reasoning model: it emits `<think>…</think>` blocks
/// and often wraps the JSON array in prose. Steps, in order:
///
/// 1. Remove every matched `<think>…</think>` block.
/// 2. If a `</think>` is still present it has no opener (for example when the
///    opening tag was supplied by the chat template), so everything up to and
///    including the last one is reasoning and is dropped. Without this, a
///    bracket or brace inside that reasoning would become the start of the
///    slice in step 4 and make the payload unparseable.
/// 3. Strip a leading ```` ```json ```` / ```` ``` ```` fence and a trailing
///    ```` ``` ```` fence.
/// 4. Slice from the first `[`/`{` to the last `]`/`}`, dropping surrounding
///    prose. An unmatched opening `<think>` (truncated stream) is left in
///    place for this step to cut away if a bracket follows it.
///
/// Brackets are ASCII, so the byte-index slice is always on a char boundary —
/// safe even when the JSON contains CJK. When no bracket pair is found the
/// cleaned text is returned as-is.
fn strip_fences(s: &str) -> String {
    const OPEN: &str = "<think>";
    const CLOSE: &str = "</think>";

    let mut t = s.trim().to_owned();
    // Remove matched <think>...</think> reasoning blocks (can be several).
    while let Some(open) = t.find(OPEN) {
        match t[open..].find(CLOSE) {
            Some(rel) => {
                let close_end = open + rel + CLOSE.len();
                t.replace_range(open..close_end, "");
            }
            None => break, // unmatched (truncated stream) — leave for bracket slice
        }
    }
    // Any close tag left over has no opener: the text before it is reasoning.
    if let Some(close) = t.rfind(CLOSE) {
        t.replace_range(..close + CLOSE.len(), "");
    }

    let t = t.trim();
    let t = t
        .strip_prefix("```json")
        .or_else(|| t.strip_prefix("```"))
        .unwrap_or(t);
    let t = t.strip_suffix("```").unwrap_or(t).trim();
    // Slice out the outermost JSON value, dropping leading/trailing prose
    // (and any unmatched-`<think>` remnant before the first bracket).
    match (t.find(['[', '{']), t.rfind([']', '}'])) {
        (Some(a), Some(b)) if b >= a => t[a..=b].to_owned(),
        _ => t.to_owned(),
    }
}

/// Unit tests for the deterministic parts of the extractor: the two gates,
/// the reply parser, and the kind policy table. The async extractors need a
/// provider and a store and are not covered here.
#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn salience_gate_drops_chitchat_and_questions() {
        assert!(!salience_gate("在吗？"));
        assert!(!salience_gate("这个怎么搞啊"));
        assert!(!salience_gate("hi"));
        assert!(!salience_gate("帮我查一下今天天气")); // task request, no self-info
    }

    #[test]
    fn salience_gate_fires_on_self_description() {
        assert!(salience_gate("我叫东升"));
        assert!(salience_gate("我比较喜欢简洁直接的回答，别啰嗦"));
        assert!(salience_gate("记一下我的发布流程：先 cargo test"));
        assert!(salience_gate("My name is Dongsheng"));
    }

    #[test]
    fn parse_handles_array_fences_and_lines() {
        let arr = r#"[{"kind":"preference","text":"用户偏好简洁","confidence":0.8}]"#;
        let v = parse_items(arr);
        assert_eq!(v.len(), 1);
        assert_eq!(v[0].kind, "preference");

        let fenced =
            "```json\n[{\"kind\":\"entity\",\"text\":\"用户叫东升\",\"confidence\":0.9}]\n```";
        assert_eq!(parse_items(fenced).len(), 1);

        let lines = "{\"kind\":\"fact\",\"text\":\"a\",\"confidence\":0.7}\n{\"kind\":\"preference\",\"text\":\"b\",\"confidence\":0.6}";
        assert_eq!(parse_items(lines).len(), 2);

        assert_eq!(parse_items("[]").len(), 0);
    }

    #[test]
    fn parse_strips_reasoning_and_surrounding_prose() {
        // The think block contains brackets of its own; it must be removed
        // before the payload is sliced out of the surrounding prose.
        let raw = "<think>用户说了 [名字]</think>\nHere you go:\n[{\"kind\":\"entity\",\"text\":\"用户叫东升\",\"confidence\":0.9}]\nDone.";
        let v = parse_items(raw);
        assert_eq!(v.len(), 1);
        assert_eq!(v[0].kind, "entity");
        assert_eq!(v[0].text, "用户叫东升");
    }

    #[test]
    fn parse_skips_incomplete_and_non_object_elements() {
        let raw = r#"[{"kind":"fact"},{"text":"x"},42,"s",{"kind":"fact","text":"ok","confidence":1}]"#;
        let v = parse_items(raw);
        assert_eq!(v.len(), 1);
        assert_eq!(v[0].text, "ok");
        assert_eq!(v[0].confidence, 1.0);
    }

    #[test]
    fn missing_or_bad_confidence_scores_zero_and_drops() {
        // No confidence field → 0.0 (will fail MIN_CONFIDENCE downstream).
        let no_conf = r#"[{"kind":"fact","text":"x"}]"#;
        let v = parse_items(no_conf);
        assert_eq!(v.len(), 1);
        assert_eq!(v[0].confidence, 0.0);

        // Out-of-range / non-numeric confidence → 0.0.
        let bad = r#"[{"kind":"fact","text":"x","confidence":"high"},{"kind":"fact","text":"y","confidence":5}]"#;
        let items = parse_items(bad);
        // Guard against a vacuous pass: both items must actually be parsed.
        assert_eq!(items.len(), 2);
        for item in items {
            assert_eq!(item.confidence, 0.0);
        }
    }

    #[test]
    fn kind_policy_rejects_note_and_unknown() {
        assert!(kind_policy("note").is_none());
        assert!(kind_policy("summary").is_none());
        assert!(kind_policy("garbage").is_none());
        assert!(kind_policy("preference").is_some());
    }

    #[test]
    fn lesson_kind_is_core_durable_but_not_pinned() {
        let (tier, importance, pinned) = kind_policy("lesson").expect("lesson allowed");
        assert!(matches!(tier, MemDocTier::Core));
        assert!(importance > 0.8);
        assert!(!pinned, "a later correction must be able to supersede it");
    }

    #[test]
    fn failure_kind_is_working_tier_decaying() {
        let (tier, importance, pinned) = kind_policy("failure").expect("failure allowed");
        assert!(
            matches!(tier, MemDocTier::Working),
            "failures decay, not Core"
        );
        assert!(importance < 0.7 && !pinned);
    }

    #[test]
    fn correction_gate_fires_on_corrections_not_chitchat() {
        assert!(correction_gate("不对，应该用 cargo test 不是 npm"));
        assert!(correction_gate("以后别用表格回答"));
        assert!(correction_gate(
            "that's wrong, you should use the debug build"
        ));
        assert!(correction_gate("next time don't add comments"));
        // Plain task requests / questions / acks must not fire.
        assert!(!correction_gate("帮我查下天气"));
        assert!(!correction_gate("好的谢谢"));
        assert!(!correction_gate("how do I build this?"));
    }
}