// hippox-drivers 0.3.1
//
// 🦛 All indivisible atomic driver units in Hippox.
//! Screenshot Driver

use crate::{
    DriverCallback, DriverCategory, DriverContext,
    types::{Driver, DriverParameter},
};
use anyhow::Result;
use image::{GenericImageView, ImageBuffer, Rgba};
use serde_json::{Value, json};
use std::collections::HashMap;

/// Stateless driver that captures a screenshot and saves it to a file.
///
/// All behaviour lives in the `Driver` implementation for this type; the struct
/// itself carries no data.
#[derive(Debug)]
pub struct ScreenshotDriver;

#[async_trait::async_trait]
impl Driver for ScreenshotDriver {
    fn name(&self) -> &str {
        "screenshot"
    }

    fn description(&self) -> &str {
        "Capture a screenshot of the entire screen or a region"
    }

    fn usage_hint(&self) -> &str {
        "Use this skill to capture screenshots. Specify region with x, y, width, height."
    }

    fn parameters(&self) -> Vec<DriverParameter> {
        vec![
            DriverParameter {
                name: "destination".to_string(),
                param_type: "string".to_string(),
                description: "Output file path (PNG format)".to_string(),
                required: true,
                default: None,
                example: Some(Value::String("/path/to/screenshot.png".to_string())),
                enum_values: None,
            },
            DriverParameter {
                name: "x".to_string(),
                param_type: "integer".to_string(),
                description: "X coordinate of capture region".to_string(),
                required: false,
                default: None,
                example: Some(Value::Number(100.into())),
                enum_values: None,
            },
            DriverParameter {
                name: "y".to_string(),
                param_type: "integer".to_string(),
                description: "Y coordinate of capture region".to_string(),
                required: false,
                default: None,
                example: Some(Value::Number(100.into())),
                enum_values: None,
            },
            DriverParameter {
                name: "width".to_string(),
                param_type: "integer".to_string(),
                description: "Width of capture region".to_string(),
                required: false,
                default: None,
                example: Some(Value::Number(800.into())),
                enum_values: None,
            },
            DriverParameter {
                name: "height".to_string(),
                param_type: "integer".to_string(),
                description: "Height of capture region".to_string(),
                required: false,
                default: None,
                example: Some(Value::Number(600.into())),
                enum_values: None,
            },
        ]
    }

    fn example_call(&self) -> Value {
        json!({
            "action": "screenshot",
            "parameters": {
                "destination": "/screenshots/desktop.png"
            }
        })
    }

    fn example_output(&self) -> String {
        "Screenshot saved to /screenshots/desktop.png".to_string()
    }

    fn category(&self) -> DriverCategory {
        DriverCategory::Media
    }

    async fn execute(
        &self,
        parameters: &HashMap<String, Value>,
        callback: Option<&dyn DriverCallback>,
        context: Option<&DriverContext>,
    ) -> Result<String> {
        let task_id = context.as_ref().and_then(|c| c.task_id()).map(String::from);
        let driver_index = context.as_ref().and_then(|c| c.driver_index());
        let step_name = context
            .as_ref()
            .and_then(|c| c.driver_name())
            .map(String::from);
        let cb = callback;
        if let Some(cb) = cb {
            cb.on_start(task_id.clone(), driver_index, step_name);
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some("Starting screenshot capture".to_string()),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(10), None);
        }
        let destination = parameters
            .get("destination")
            .and_then(|v| v.as_str())
            .ok_or_else(|| anyhow::anyhow!("Missing 'destination' parameter"))?;
        let x = parameters
            .get("x")
            .and_then(|v| v.as_i64())
            .map(|v| v as u32);
        let y = parameters
            .get("y")
            .and_then(|v| v.as_i64())
            .map(|v| v as u32);
        let width = parameters
            .get("width")
            .and_then(|v| v.as_u64())
            .map(|v| v as u32);
        let height = parameters
            .get("height")
            .and_then(|v| v.as_u64())
            .map(|v| v as u32);
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some(format!(
                    "Destination: {:?}, region: x={:?}, y={:?}, w={:?}, h={:?}",
                    destination, x, y, width, height
                )),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(20), None);
        }
        use xcap::Monitor;
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some("Getting monitors...".to_string()),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(30), None);
        }
        let monitors =
            Monitor::all().map_err(|e| anyhow::anyhow!("Failed to get monitors: {}", e))?;
        let monitor = monitors
            .first()
            .ok_or_else(|| anyhow::anyhow!("No monitor found"))?;
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some("Capturing screen...".to_string()),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(50), None);
        }
        let image = monitor
            .capture_image()
            .map_err(|e| anyhow::anyhow!("Failed to capture screen: {}", e))?;
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some("Processing captured image...".to_string()),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(70), None);
        }
        let result = if let (Some(x), Some(y), Some(w), Some(h)) = (x, y, width, height) {
            let (img_w, img_h) = image.dimensions();
            if x + w <= img_w && y + h <= img_h {
                image::imageops::crop(&mut image.clone(), x, y, w, h).to_image()
            } else {
                anyhow::bail!(
                    "Crop region out of bounds: image size {}x{}, region {}x{} at ({}, {})",
                    img_w,
                    img_h,
                    w,
                    h,
                    x,
                    y
                );
            }
        } else {
            image
        };
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some("Saving screenshot...".to_string()),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(85), None);
        }
        result
            .save(destination)
            .map_err(|e| anyhow::anyhow!("Failed to save screenshot: {}", e))?;
        let result_msg = format!("Screenshot saved to {}", destination);
        if let Some(cb) = cb {
            cb.on_log(
                task_id.clone(),
                driver_index,
                Some(format!("Result: {}", result_msg)),
            );
            cb.on_progress(task_id.clone(), driver_index, Some(100), None);
            cb.on_complete(
                task_id.clone(),
                driver_index,
                Some("screenshot".to_string()),
                Some(result_msg.clone()),
            );
        }
        Ok(result_msg)
    }
}