nika 0.35.4 - Docs.rs

//! Spawn Agent Tool (MVP 8 Phase 2)
//!
//! Internal tool for recursive agent spawning. Allows an agent to delegate
//! subtasks to child agents, enabling hierarchical task decomposition.
//!
//! ## Depth Limit
//!
//! To prevent infinite recursion, each spawn tracks depth and enforces limits:
//! - Default limit: 3 levels
//! - Maximum limit: 10 levels
//! - Spawning at max depth returns an error
//!
//! ## Events
//!
//! Spawning emits an `AgentSpawned` event with:
//! - `parent_task_id`: The spawning agent's task ID
//! - `child_task_id`: The new agent's task ID
//! - `depth`: Current recursion depth
//!
//! ## rig::ToolDyn Integration
//!
//! SpawnAgentTool implements `rig::tool::ToolDyn` for seamless integration
//! with `RigAgentLoop`. When an agent has `depth_limit > current_depth`,
//! the spawn_agent tool is automatically added to its tool list.
//!
//! ## Example
//!
//! ```json
//! {
//!   "task_id": "subtask-1",
//!   "prompt": "Generate the header section",
//!   "context": {"entity": "qr-code"},
//!   "max_turns": 5
//! }
//! ```

use std::future::Future;
use std::pin::Pin;
use std::sync::Arc;

use rig::completion::ToolDefinition;
use rig::tool::{ToolDyn, ToolError};
use rustc_hash::FxHashMap;
use serde::{Deserialize, Serialize};
use serde_json::{json, Value};

use crate::ast::AgentParams;
use crate::event::{EventKind, EventLog};
use crate::mcp::McpClient;

/// Parameters for spawning a child agent
#[derive(Debug, Clone, Serialize, Deserialize)]
pub struct SpawnAgentParams {
    /// Unique identifier for the child task
    pub task_id: String,
    /// Prompt/goal for the child agent
    pub prompt: String,
    /// Optional context data to pass to child
    #[serde(default)]
    pub context: Option<Value>,
    /// Optional max turns override for child
    #[serde(default)]
    pub max_turns: Option<u32>,
}

/// Internal tool for spawning sub-agents
///
/// This tool is automatically added to agents that have depth_limit > current_depth.
/// It allows recursive task decomposition with safety limits.
///
/// Implements `rig::tool::ToolDyn` for integration with RigAgentLoop.
#[derive(Clone)]
pub struct SpawnAgentTool {
    /// Current recursion depth (1 = root agent)
    current_depth: u32,
    /// Maximum allowed depth
    max_depth: u32,
    /// Parent task ID for event linking
    parent_task_id: Arc<str>,
    /// Event log for emitting AgentSpawned events
    event_log: EventLog,
    /// MCP clients for child agent tool access
    mcp_clients: FxHashMap<String, Arc<McpClient>>,
    /// MCP server names for child agents (from parent AgentParams.mcp)
    mcp_names: Vec<String>,
}

impl SpawnAgentTool {
    /// Create a new SpawnAgentTool (minimal - for testing without MCP)
    ///
    /// # Arguments
    /// * `current_depth` - Current recursion depth (starts at 1 for root)
    /// * `max_depth` - Maximum allowed depth (default 3)
    /// * `parent_task_id` - ID of the parent task
    /// * `event_log` - Shared event log for observability
    pub fn new(
        current_depth: u32,
        max_depth: u32,
        parent_task_id: Arc<str>,
        event_log: EventLog,
    ) -> Self {
        Self {
            current_depth,
            max_depth,
            parent_task_id,
            event_log,
            mcp_clients: FxHashMap::default(),
            mcp_names: Vec::new(),
        }
    }

    /// Create a new SpawnAgentTool with MCP clients (for production use)
    ///
    /// # Arguments
    /// * `current_depth` - Current recursion depth (starts at 1 for root)
    /// * `max_depth` - Maximum allowed depth (default 3)
    /// * `parent_task_id` - ID of the parent task
    /// * `event_log` - Shared event log for observability
    /// * `mcp_clients` - Connected MCP clients for child agent tools
    /// * `mcp_names` - MCP server names to pass to child agents
    pub fn with_mcp(
        current_depth: u32,
        max_depth: u32,
        parent_task_id: Arc<str>,
        event_log: EventLog,
        mcp_clients: FxHashMap<String, Arc<McpClient>>,
        mcp_names: Vec<String>,
    ) -> Self {
        Self {
            current_depth,
            max_depth,
            parent_task_id,
            event_log,
            mcp_clients,
            mcp_names,
        }
    }

    /// Get the tool name
    pub fn name(&self) -> &str {
        "spawn_agent"
    }

    /// Get the JSON Schema definition for this tool
    ///
    /// Note: OpenAI's strict mode requires ALL properties in `required` and
    /// `additionalProperties: false`. We keep the schema simple with only
    /// required fields - context and max_turns use sensible defaults.
    pub fn definition(&self) -> ToolDefinition {
        ToolDefinition {
            name: "spawn_agent".to_string(),
            description: "Spawn a sub-agent to handle a delegated subtask. The child agent \
                         runs independently with max 10 turns and returns its result."
                .to_string(),
            parameters: json!({
                "type": "object",
                "properties": {
                    "task_id": {
                        "type": "string",
                        "description": "Unique identifier for the child task (e.g., 'subtask-1')"
                    },
                    "prompt": {
                        "type": "string",
                        "description": "Goal/prompt describing what the child agent should accomplish"
                    }
                },
                "required": ["task_id", "prompt"],
                "additionalProperties": false
            }),
        }
    }

    /// Execute the spawn_agent tool
    ///
    /// Creates and runs a child `RigAgentLoop` with inherited MCP clients.
    /// The child agent runs to completion and its result is returned.
    ///
    /// # Errors
    /// Returns an error if:
    /// - Current depth >= max depth (depth limit reached)
    /// - Invalid arguments
    /// - Child agent execution fails
    pub async fn call(&self, args: String) -> Result<String, SpawnAgentError> {
        // Parse arguments
        let params: SpawnAgentParams =
            serde_json::from_str(&args).map_err(|e| SpawnAgentError::InvalidArgs(e.to_string()))?;

        // Check depth limit
        if self.current_depth >= self.max_depth {
            return Err(SpawnAgentError::DepthLimitReached {
                current: self.current_depth,
                max: self.max_depth,
            });
        }

        // Emit AgentSpawned event
        let child_depth = self.current_depth + 1;
        self.event_log.emit(EventKind::AgentSpawned {
            parent_task_id: self.parent_task_id.clone(),
            child_task_id: Arc::from(params.task_id.as_str()),
            depth: child_depth,
        });

        // If no MCP clients, return placeholder (for compatibility with tests)
        if self.mcp_clients.is_empty() {
            return Ok(json!({
                "status": "spawned",
                "child_task_id": params.task_id,
                "depth": child_depth,
                "note": "Child agent execution requires MCP client context"
            })
            .to_string());
        }

        // Build child AgentParams
        // Calculate remaining depth from PARENT's current_depth, not child_depth.
        // With depth_limit=3:
        //   - Root (depth=1, max=3): remaining = 3-1 = 2 → child gets max=2
        //   - Child (depth=1, max=2): remaining = 2-1 = 1 → grandchild gets max=1
        //   - Grandchild (depth=1, max=1): 1 >= 1, cannot spawn ✓
        let remaining_depth = self.max_depth.saturating_sub(self.current_depth);
        let child_params = AgentParams {
            prompt: params.prompt,
            system: params.context.as_ref().map(|ctx| {
                format!(
                    "Context from parent agent:\n{}",
                    serde_json::to_string_pretty(ctx).unwrap_or_default()
                )
            }),
            mcp: self.mcp_names.clone(),
            max_turns: params.max_turns.or(Some(10)),
            depth_limit: Some(remaining_depth),
            ..Default::default()
        };

        // Create child RigAgentLoop
        let mut child_loop = super::RigAgentLoop::new(
            params.task_id.clone(),
            child_params,
            self.event_log.clone(),
            self.mcp_clients.clone(),
        )
        .map_err(|e| SpawnAgentError::ExecutionFailed(e.to_string()))?;

        // Execute child agent with auto-detected provider (production mode)
        // Uses ANTHROPIC_API_KEY or OPENAI_API_KEY from environment
        let result = child_loop
            .run_auto()
            .await
            .map_err(|e| SpawnAgentError::ExecutionFailed(e.to_string()))?;

        // Return child's result
        Ok(json!({
            "status": "completed",
            "child_task_id": params.task_id,
            "depth": child_depth,
            "result": result.final_output,
            "turns": result.turns,
            "total_tokens": result.total_tokens
        })
        .to_string())
    }

    /// Check if spawning is allowed at current depth
    pub fn can_spawn(&self) -> bool {
        self.current_depth < self.max_depth
    }

    /// Get the depth that child agents would have
    pub fn child_depth(&self) -> u32 {
        self.current_depth + 1
    }
}

/// Errors that can occur when spawning agents
#[derive(Debug, thiserror::Error)]
pub enum SpawnAgentError {
    #[error("spawn_agent: depth limit reached (current: {current}, max: {max})")]
    DepthLimitReached { current: u32, max: u32 },

    #[error("spawn_agent: invalid arguments - {0}")]
    InvalidArgs(String),

    #[error("spawn_agent: execution failed - {0}")]
    ExecutionFailed(String),
}

impl std::fmt::Debug for SpawnAgentTool {
    fn fmt(&self, f: &mut std::fmt::Formatter<'_>) -> std::fmt::Result {
        f.debug_struct("SpawnAgentTool")
            .field("current_depth", &self.current_depth)
            .field("max_depth", &self.max_depth)
            .field("parent_task_id", &self.parent_task_id)
            .finish()
    }
}

// ═══════════════════════════════════════════════════════════════════════════════
// rig::ToolDyn implementation (for integration with RigAgentLoop)
// ═══════════════════════════════════════════════════════════════════════════════

/// Type alias for boxed future (required by ToolDyn)
type BoxFuture<'a, T> = Pin<Box<dyn Future<Output = T> + Send + 'a>>;

impl ToolDyn for SpawnAgentTool {
    fn name(&self) -> String {
        "spawn_agent".to_string()
    }

    fn definition(&self, _prompt: String) -> BoxFuture<'_, ToolDefinition> {
        // Note: OpenAI's strict mode requires ALL properties in `required` and
        // `additionalProperties: false`. Keep schema simple with only required fields.
        let def = ToolDefinition {
            name: "spawn_agent".to_string(),
            description: "Spawn a sub-agent to handle a delegated subtask. The child agent \
                         runs independently with max 10 turns and returns its result."
                .to_string(),
            parameters: json!({
                "type": "object",
                "properties": {
                    "task_id": {
                        "type": "string",
                        "description": "Unique identifier for the child task (e.g., 'subtask-1')"
                    },
                    "prompt": {
                        "type": "string",
                        "description": "Goal/prompt describing what the child agent should accomplish"
                    }
                },
                "required": ["task_id", "prompt"],
                "additionalProperties": false
            }),
        };
        Box::pin(async move { def })
    }

    fn call(&self, args: String) -> BoxFuture<'_, Result<String, ToolError>> {
        Box::pin(async move {
            self.call(args).await.map_err(|e| {
                ToolError::ToolCallError(Box::new(std::io::Error::other(e.to_string())))
            })
        })
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn spawn_agent_tool_name() {
        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());
        assert_eq!(tool.name(), "spawn_agent");
    }

    #[test]
    fn spawn_agent_tool_can_spawn() {
        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());
        assert!(tool.can_spawn());

        let at_limit = SpawnAgentTool::new(3, 3, "parent".into(), EventLog::new());
        assert!(!at_limit.can_spawn());
    }

    #[test]
    fn spawn_agent_tool_child_depth() {
        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());
        assert_eq!(tool.child_depth(), 2);
    }

    #[test]
    fn spawn_agent_params_deserializes() {
        let json = json!({
            "task_id": "child-1",
            "prompt": "Do something",
            "context": {"key": "value"},
            "max_turns": 5
        });

        let params: SpawnAgentParams = serde_json::from_value(json).unwrap();
        assert_eq!(params.task_id, "child-1");
        assert_eq!(params.prompt, "Do something");
        assert!(params.context.is_some());
        assert_eq!(params.max_turns, Some(5));
    }

    #[test]
    fn spawn_agent_params_minimal() {
        let json = json!({
            "task_id": "child-1",
            "prompt": "Do something"
        });

        let params: SpawnAgentParams = serde_json::from_value(json).unwrap();
        assert_eq!(params.task_id, "child-1");
        assert!(params.context.is_none());
        assert!(params.max_turns.is_none());
    }

    #[tokio::test]
    async fn spawn_agent_at_max_depth_fails() {
        let tool = SpawnAgentTool::new(3, 3, "parent".into(), EventLog::new());

        let args = json!({
            "task_id": "child-1",
            "prompt": "Do something"
        })
        .to_string();

        let result = tool.call(args).await;
        assert!(result.is_err());

        let err = result.unwrap_err();
        assert!(err.to_string().contains("depth limit"));
    }

    #[tokio::test]
    async fn spawn_agent_below_max_depth_succeeds() {
        let tool = SpawnAgentTool::new(2, 3, "parent".into(), EventLog::new());

        let args = json!({
            "task_id": "child-1",
            "prompt": "Do something"
        })
        .to_string();

        let result = tool.call(args).await;
        assert!(result.is_ok());

        let response: Value = serde_json::from_str(&result.unwrap()).unwrap();
        assert_eq!(response["status"], "spawned");
        assert_eq!(response["child_task_id"], "child-1");
        assert_eq!(response["depth"], 3);
    }

    #[tokio::test]
    async fn spawn_agent_emits_event() {
        let event_log = EventLog::new();
        let tool = SpawnAgentTool::new(1, 3, "parent".into(), event_log.clone());

        let args = json!({
            "task_id": "child-1",
            "prompt": "Do something"
        })
        .to_string();

        let _ = tool.call(args).await;

        // Check that AgentSpawned event was emitted
        let events = event_log.events();
        let spawned_events: Vec<_> = events
            .iter()
            .filter(|e| matches!(e.kind, EventKind::AgentSpawned { .. }))
            .collect();

        assert_eq!(spawned_events.len(), 1);

        if let EventKind::AgentSpawned {
            parent_task_id,
            child_task_id,
            depth,
        } = &spawned_events[0].kind
        {
            assert_eq!(&**parent_task_id, "parent");
            assert_eq!(&**child_task_id, "child-1");
            assert_eq!(*depth, 2);
        }
    }

    #[test]
    fn tool_definition_has_required_params() {
        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());
        let def = tool.definition();

        let required = def
            .parameters
            .get("required")
            .and_then(|v| v.as_array())
            .expect("required should be an array");

        // OpenAI strict mode: all properties in required + additionalProperties: false
        // We keep schema simple with only task_id and prompt (context/max_turns use defaults)
        assert!(required.iter().any(|v| v == "task_id"));
        assert!(required.iter().any(|v| v == "prompt"));
        assert_eq!(required.len(), 2);

        // Check additionalProperties is false (required for OpenAI strict mode)
        let additional = def
            .parameters
            .get("additionalProperties")
            .expect("additionalProperties should exist");
        assert_eq!(additional, false);
    }

    // =========================================================================
    // rig::ToolDyn implementation tests
    // =========================================================================

    #[test]
    fn spawn_agent_implements_tool_dyn() {
        use rig::tool::ToolDyn;

        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());

        // Test ToolDyn::name()
        let name: String = ToolDyn::name(&tool);
        assert_eq!(name, "spawn_agent");
    }

    #[tokio::test]
    async fn spawn_agent_tool_dyn_definition_returns_correct_schema() {
        use rig::tool::ToolDyn;

        let tool = SpawnAgentTool::new(1, 3, "parent".into(), EventLog::new());

        // Test ToolDyn::definition()
        let def = ToolDyn::definition(&tool, "test".to_string()).await;

        assert_eq!(def.name, "spawn_agent");
        assert!(def.description.contains("sub-agent"));
        assert!(def.parameters.get("required").is_some());
    }

    #[tokio::test]
    async fn spawn_agent_tool_dyn_call_enforces_depth_limit() {
        use rig::tool::ToolDyn;

        let tool = SpawnAgentTool::new(3, 3, "parent".into(), EventLog::new());

        let args = json!({
            "task_id": "child-1",
            "prompt": "Do something"
        })
        .to_string();

        // Test ToolDyn::call() - should fail at max depth
        let result = ToolDyn::call(&tool, args).await;
        assert!(result.is_err());
        assert!(result.unwrap_err().to_string().contains("depth limit"));
    }

    #[test]
    fn spawn_agent_with_mcp_creates_correctly() {
        let event_log = EventLog::new();
        let mcp_clients = FxHashMap::default();
        let mcp_names = vec!["novanet".to_string()];

        let tool = SpawnAgentTool::with_mcp(
            1,
            3,
            "parent".into(),
            event_log,
            mcp_clients,
            mcp_names.clone(),
        );

        assert_eq!(tool.name(), "spawn_agent");
        assert!(tool.can_spawn());
        assert_eq!(tool.child_depth(), 2);
    }

    // =========================================================================
    // Depth calculation regression tests
    // =========================================================================

    #[test]
    fn depth_calculation_allows_three_levels() {
        // With depth_limit=3, we should allow:
        // - Root (depth=1) → can spawn child
        // - Child (depth=2) → can spawn grandchild
        // - Grandchild (depth=3) → cannot spawn

        // Root agent: current=1, max=3
        let root = SpawnAgentTool::new(1, 3, "root".into(), EventLog::new());
        assert!(root.can_spawn(), "Root should be able to spawn");
        assert_eq!(root.child_depth(), 2);

        // Simulate what child receives: remaining = max - current = 3 - 1 = 2
        // So child sees: current=1, max=2
        let child = SpawnAgentTool::new(1, 2, "child".into(), EventLog::new());
        assert!(
            child.can_spawn(),
            "Child should be able to spawn grandchild"
        );
        assert_eq!(child.child_depth(), 2);

        // Simulate what grandchild receives: remaining = max - current = 2 - 1 = 1
        // So grandchild sees: current=1, max=1
        let grandchild = SpawnAgentTool::new(1, 1, "grandchild".into(), EventLog::new());
        assert!(
            !grandchild.can_spawn(),
            "Grandchild should NOT be able to spawn"
        );
    }

    #[test]
    fn remaining_depth_calculation_formula() {
        // Verify the formula: remaining_depth = max_depth - current_depth
        // NOT: max_depth - child_depth (old buggy formula)

        // Root: current=1, max=3
        let root_current = 1_u32;
        let root_max = 3_u32;
        let child_will_receive = root_max.saturating_sub(root_current); // 3-1=2 ✓
        assert_eq!(child_will_receive, 2, "Child should receive depth_limit=2");

        // Child (simulated): current=1, max=2
        let child_current = 1_u32;
        let child_max = child_will_receive; // 2
        let grandchild_will_receive = child_max.saturating_sub(child_current); // 2-1=1 ✓
        assert_eq!(
            grandchild_will_receive, 1,
            "Grandchild should receive depth_limit=1"
        );

        // Grandchild (simulated): current=1, max=1
        let grandchild_current = 1_u32;
        let grandchild_max = grandchild_will_receive; // 1
        let can_spawn = grandchild_current < grandchild_max; // 1 < 1 = false ✓
        assert!(!can_spawn, "Grandchild should not be able to spawn");
    }
}