entrenar 0.7.9 - Docs.rs

//! Extended command types - Completion, Bench, Inspect, Audit, Monitor, Publish

use clap::{Parser, Subcommand};
use std::path::PathBuf;

use super::types::{AuditType, InspectMode, OutputFormat, ShellType};

/// Arguments for completion command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct CompletionArgs {
    /// Shell to generate completions for
    #[arg(value_name = "SHELL")]
    pub shell: ShellType,
}

/// Arguments for bench command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct BenchArgs {
    /// Path to model or config file
    #[arg(value_name = "INPUT")]
    pub input: PathBuf,

    /// Number of warmup iterations
    #[arg(long, default_value = "10")]
    pub warmup: usize,

    /// Number of benchmark iterations
    #[arg(long, default_value = "100")]
    pub iterations: usize,

    /// Batch sizes to test (comma-separated)
    #[arg(long, default_value = "1,8,32")]
    pub batch_sizes: String,

    /// Output format (text, json)
    #[arg(short, long, default_value = "text")]
    pub format: OutputFormat,
}

/// Arguments for inspect command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct InspectArgs {
    /// Path to data file or model
    #[arg(value_name = "INPUT")]
    pub input: PathBuf,

    /// Inspection mode
    #[arg(short, long, default_value = "summary")]
    pub mode: InspectMode,

    /// Columns to inspect (comma-separated)
    #[arg(long)]
    pub columns: Option<String>,

    /// Z-score threshold for outlier detection
    #[arg(long, default_value = "3.0")]
    pub z_threshold: f32,
}

/// Arguments for audit command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct AuditArgs {
    /// Path to model or config file
    #[arg(value_name = "INPUT")]
    pub input: PathBuf,

    /// Audit type
    #[arg(short, long, default_value = "bias")]
    pub audit_type: AuditType,

    /// Protected attribute column
    #[arg(long)]
    pub protected_attr: Option<String>,

    /// Fairness threshold (0.0-1.0)
    #[arg(long, default_value = "0.8")]
    pub threshold: f32,

    /// Output format (text, json, html)
    #[arg(short, long, default_value = "text")]
    pub format: OutputFormat,
}

/// Arguments for monitor command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct MonitorArgs {
    /// Path to model or config file
    #[arg(value_name = "INPUT")]
    pub input: PathBuf,

    /// Baseline statistics file
    #[arg(long)]
    pub baseline: Option<PathBuf>,

    /// Drift detection threshold (PSI)
    #[arg(long, default_value = "0.2")]
    pub threshold: f32,

    /// Monitoring interval in seconds
    #[arg(long, default_value = "60")]
    pub interval: u64,

    /// Output format (text, json)
    #[arg(short, long, default_value = "text")]
    pub format: OutputFormat,
}

/// Arguments for the publish command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct PublishArgs {
    /// Path to trained model output directory
    #[arg(value_name = "MODEL_DIR", default_value = "./output")]
    pub model_dir: PathBuf,

    /// HuggingFace repo ID (e.g., myuser/my-model)
    #[arg(long)]
    pub repo: String,

    /// Make the repository private
    #[arg(long)]
    pub private: bool,

    /// Generate and upload a model card
    #[arg(long, default_value_t = true)]
    pub model_card: bool,

    /// Merge LoRA adapters into base weights before publishing
    #[arg(long)]
    pub merge_adapters: bool,

    /// Base model HF repo ID (for model card metadata)
    #[arg(long)]
    pub base_model: Option<String>,

    /// Export format (safetensors or gguf)
    #[arg(long, default_value = "safetensors")]
    pub format: String,

    /// Dry run (validate but don't upload)
    #[arg(long)]
    pub dry_run: bool,
}

/// Arguments for the finetune command (plan/apply classification training)
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct FinetuneArgs {
    /// Subcommand to execute
    #[command(subcommand)]
    pub command: FinetuneCommand,
}

/// Finetune subcommands (forjar-style plan/apply)
#[derive(Subcommand, Debug, Clone, PartialEq)]
pub enum FinetuneCommand {
    /// Generate a training plan (validate data, estimate resources, build HPO config)
    Plan {
        /// Path to training data (JSONL with {"input": ..., "label": N})
        #[arg(long)]
        data: PathBuf,

        /// Path to model weights directory (e.g., Qwen2.5-Coder-0.5B)
        #[arg(long)]
        model_path: Option<PathBuf>,

        /// Model size hint (e.g., "0.5B", "9B")
        #[arg(long, default_value = "0.5B")]
        model_size: String,

        /// Number of output classes
        #[arg(long, default_value = "5")]
        num_classes: usize,

        /// Output directory for plan and checkpoints
        #[arg(short, long, default_value = "./output")]
        output_dir: PathBuf,

        /// HPO strategy: tpe, grid, random, or manual
        #[arg(long, default_value = "tpe")]
        strategy: String,

        /// HPO budget (number of trials)
        #[arg(long, default_value = "20")]
        budget: usize,

        /// Scout mode (1 epoch per trial for fast HPO)
        #[arg(long)]
        scout: bool,

        /// Maximum epochs per trial
        #[arg(long, default_value = "10")]
        max_epochs: usize,

        /// Manual learning rate (for strategy=manual)
        #[arg(long)]
        lr: Option<f32>,

        /// Manual LoRA rank (for strategy=manual)
        #[arg(long)]
        lora_rank: Option<usize>,

        /// Manual batch size (for strategy=manual)
        #[arg(long)]
        batch_size: Option<usize>,

        /// LoRA alpha (for strategy=manual; defaults to lora_rank)
        #[arg(long)]
        lora_alpha: Option<f32>,

        /// Warmup fraction (for strategy=manual; default 0.1)
        #[arg(long)]
        warmup: Option<f32>,

        /// Gradient clip norm (for strategy=manual; default 1.0)
        #[arg(long)]
        gradient_clip: Option<f32>,

        /// LR min ratio for cosine decay (for strategy=manual; default 0.01)
        #[arg(long)]
        lr_min_ratio: Option<f32>,

        /// Class weight strategy: uniform, inverse_freq, sqrt_inverse
        #[arg(long)]
        class_weights: Option<String>,

        /// Target modules: qv, qkv, all_linear
        #[arg(long)]
        target_modules: Option<String>,
    },

    /// Execute a training plan (load model, run trials, save checkpoints)
    Apply {
        /// Path to plan YAML/JSON (generated by `finetune plan`)
        #[arg(long)]
        plan: PathBuf,

        /// Path to model weights directory
        #[arg(long)]
        model_path: PathBuf,

        /// Path to training data (JSONL)
        #[arg(long)]
        data: PathBuf,

        /// Output directory for checkpoints and leaderboard
        #[arg(short, long, default_value = "./output")]
        output_dir: PathBuf,
    },
}

/// Arguments for the experiments command
#[derive(Parser, Debug, Clone, PartialEq)]
pub struct ExperimentsArgs {
    /// Subcommand to execute
    #[command(subcommand)]
    pub command: ExperimentsCommand,

    /// Project directory (defaults to current directory)
    #[arg(short, long, global = true, default_value = ".")]
    pub project: PathBuf,

    /// Output format (text, json)
    #[arg(short, long, global = true, default_value = "text")]
    pub format: OutputFormat,
}

/// Experiment store subcommands
#[derive(Subcommand, Debug, Clone, PartialEq)]
pub enum ExperimentsCommand {
    /// List all experiments
    List,

    /// Show details of a specific experiment
    Show {
        /// Experiment ID
        #[arg(value_name = "ID")]
        id: String,
    },

    /// List runs for an experiment
    Runs {
        /// Experiment ID
        #[arg(value_name = "EXPERIMENT_ID")]
        experiment_id: String,
    },

    /// Show metrics for a run
    Metrics {
        /// Run ID
        #[arg(value_name = "RUN_ID")]
        run_id: String,

        /// Metric key (e.g., "loss", "accuracy")
        #[arg(value_name = "KEY")]
        key: String,
    },

    /// Delete an experiment and all its runs
    Delete {
        /// Experiment ID
        #[arg(value_name = "ID")]
        id: String,
    },
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::config::cli::parse_args;

    #[test]
    fn test_parse_completion_command() {
        let cli = parse_args(["entrenar", "completion", "bash"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Completion(args) => {
                assert_eq!(args.shell, ShellType::Bash);
            }
            _ => panic!("Expected Completion command"),
        }
    }

    #[test]
    fn test_parse_bench_command() {
        let cli = parse_args(["entrenar", "bench", "model.gguf"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Bench(args) => {
                assert_eq!(args.input, PathBuf::from("model.gguf"));
                assert_eq!(args.warmup, 10);
                assert_eq!(args.iterations, 100);
                assert_eq!(args.batch_sizes, "1,8,32");
            }
            _ => panic!("Expected Bench command"),
        }
    }

    #[test]
    fn test_parse_bench_with_options() {
        let cli = parse_args([
            "entrenar",
            "bench",
            "model.gguf",
            "--warmup",
            "5",
            "--iterations",
            "50",
            "--batch-sizes",
            "1,2,4,8",
            "--format",
            "json",
        ])
        .expect("operation should succeed");
        match cli.command {
            crate::config::cli::Command::Bench(args) => {
                assert_eq!(args.warmup, 5);
                assert_eq!(args.iterations, 50);
                assert_eq!(args.batch_sizes, "1,2,4,8");
                assert_eq!(args.format, OutputFormat::Json);
            }
            _ => panic!("Expected Bench command"),
        }
    }

    #[test]
    fn test_parse_inspect_command() {
        let cli =
            parse_args(["entrenar", "inspect", "data.parquet"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Inspect(args) => {
                assert_eq!(args.input, PathBuf::from("data.parquet"));
                assert_eq!(args.mode, InspectMode::Summary);
                assert!((args.z_threshold - 3.0).abs() < 1e-6);
            }
            _ => panic!("Expected Inspect command"),
        }
    }

    #[test]
    fn test_parse_inspect_with_options() {
        let cli = parse_args([
            "entrenar",
            "inspect",
            "data.parquet",
            "--mode",
            "outliers",
            "--columns",
            "col1,col2",
            "--z-threshold",
            "2.5",
        ])
        .expect("operation should succeed");
        match cli.command {
            crate::config::cli::Command::Inspect(args) => {
                assert_eq!(args.mode, InspectMode::Outliers);
                assert_eq!(args.columns, Some("col1,col2".to_string()));
                assert!((args.z_threshold - 2.5).abs() < 1e-6);
            }
            _ => panic!("Expected Inspect command"),
        }
    }

    #[test]
    fn test_parse_audit_command() {
        let cli = parse_args(["entrenar", "audit", "model.gguf"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Audit(args) => {
                assert_eq!(args.input, PathBuf::from("model.gguf"));
                assert_eq!(args.audit_type, AuditType::Bias);
                assert!((args.threshold - 0.8).abs() < 1e-6);
            }
            _ => panic!("Expected Audit command"),
        }
    }

    #[test]
    fn test_parse_audit_with_options() {
        let cli = parse_args([
            "entrenar",
            "audit",
            "model.gguf",
            "--audit-type",
            "fairness",
            "--protected-attr",
            "gender",
            "--threshold",
            "0.9",
            "--format",
            "json",
        ])
        .expect("operation should succeed");
        match cli.command {
            crate::config::cli::Command::Audit(args) => {
                assert_eq!(args.audit_type, AuditType::Fairness);
                assert_eq!(args.protected_attr, Some("gender".to_string()));
                assert!((args.threshold - 0.9).abs() < 1e-6);
                assert_eq!(args.format, OutputFormat::Json);
            }
            _ => panic!("Expected Audit command"),
        }
    }

    #[test]
    fn test_parse_monitor_command() {
        let cli =
            parse_args(["entrenar", "monitor", "model.gguf"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Monitor(args) => {
                assert_eq!(args.input, PathBuf::from("model.gguf"));
                assert!((args.threshold - 0.2).abs() < 1e-6);
                assert_eq!(args.interval, 60);
            }
            _ => panic!("Expected Monitor command"),
        }
    }

    #[test]
    fn test_parse_monitor_with_options() {
        let cli = parse_args([
            "entrenar",
            "monitor",
            "model.gguf",
            "--baseline",
            "baseline.json",
            "--threshold",
            "0.3",
            "--interval",
            "120",
            "--format",
            "json",
        ])
        .expect("operation should succeed");
        match cli.command {
            crate::config::cli::Command::Monitor(args) => {
                assert_eq!(args.baseline, Some(PathBuf::from("baseline.json")));
                assert!((args.threshold - 0.3).abs() < 1e-6);
                assert_eq!(args.interval, 120);
                assert_eq!(args.format, OutputFormat::Json);
            }
            _ => panic!("Expected Monitor command"),
        }
    }

    // Additional coverage tests for derive traits

    #[test]
    fn test_completion_args_debug_clone() {
        let args = CompletionArgs { shell: ShellType::Bash };
        let debug = format!("{args:?}");
        assert!(debug.contains("CompletionArgs"));

        let cloned = args.clone();
        assert_eq!(args, cloned);
    }

    #[test]
    fn test_bench_args_debug_clone() {
        let args = BenchArgs {
            input: PathBuf::from("model.bin"),
            warmup: 5,
            iterations: 50,
            batch_sizes: "1,2,4".to_string(),
            format: OutputFormat::Text,
        };
        let debug = format!("{args:?}");
        assert!(debug.contains("BenchArgs"));

        let cloned = args.clone();
        assert_eq!(args, cloned);
    }

    #[test]
    fn test_inspect_args_debug_clone() {
        let args = InspectArgs {
            input: PathBuf::from("data.csv"),
            mode: InspectMode::Outliers,
            columns: Some("col1".to_string()),
            z_threshold: 2.5,
        };
        let debug = format!("{args:?}");
        assert!(debug.contains("InspectArgs"));

        let cloned = args.clone();
        assert_eq!(args, cloned);
    }

    #[test]
    fn test_audit_args_debug_clone() {
        let args = AuditArgs {
            input: PathBuf::from("model.bin"),
            audit_type: AuditType::Bias,
            protected_attr: Some("age".to_string()),
            threshold: 0.75,
            format: OutputFormat::Json,
        };
        let debug = format!("{args:?}");
        assert!(debug.contains("AuditArgs"));

        let cloned = args.clone();
        assert_eq!(args, cloned);
    }

    #[test]
    fn test_monitor_args_debug_clone() {
        let args = MonitorArgs {
            input: PathBuf::from("model.bin"),
            baseline: Some(PathBuf::from("base.json")),
            threshold: 0.25,
            interval: 30,
            format: OutputFormat::Text,
        };
        let debug = format!("{args:?}");
        assert!(debug.contains("MonitorArgs"));

        let cloned = args.clone();
        assert_eq!(args, cloned);
    }

    #[test]
    fn test_completion_other_shells() {
        // Test other shell types for coverage
        let cli = parse_args(["entrenar", "completion", "zsh"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Completion(args) => {
                assert_eq!(args.shell, ShellType::Zsh);
            }
            _ => panic!("Expected Completion command"),
        }

        let cli = parse_args(["entrenar", "completion", "fish"]).expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Completion(args) => {
                assert_eq!(args.shell, ShellType::Fish);
            }
            _ => panic!("Expected Completion command"),
        }
    }

    #[test]
    fn test_inspect_distribution_mode() {
        let cli = parse_args(["entrenar", "inspect", "data.csv", "--mode", "distribution"])
            .expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Inspect(args) => {
                assert_eq!(args.mode, InspectMode::Distribution);
            }
            _ => panic!("Expected Inspect command"),
        }
    }

    #[test]
    fn test_audit_privacy_security_types() {
        let cli = parse_args(["entrenar", "audit", "model.bin", "--audit-type", "privacy"])
            .expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Audit(args) => {
                assert_eq!(args.audit_type, AuditType::Privacy);
            }
            _ => panic!("Expected Audit command"),
        }

        let cli = parse_args(["entrenar", "audit", "model.bin", "--audit-type", "security"])
            .expect("parsing should succeed");
        match cli.command {
            crate::config::cli::Command::Audit(args) => {
                assert_eq!(args.audit_type, AuditType::Security);
            }
            _ => panic!("Expected Audit command"),
        }
    }
}