piano 0.15.0 - Docs.rs

use std::collections::{HashMap, HashSet};
use std::io::IsTerminal;
use std::path::{Path, PathBuf};
use std::process;
use std::sync::atomic::{AtomicBool, Ordering};
use std::time::Duration;

use clap::{Parser, Subcommand};

use piano::build::{
    CargoTarget, build_instrumented, cargo_metadata, clean_stale_piano_files, find_current_package,
    find_project_root, find_target, prebuild_runtime, prebuild_runtime_from_path,
};
use piano::error::{Error, io_context};
use piano::report::{
    diff_runs, diff_runs_json, find_latest_run_file, find_latest_run_file_since,
    find_ndjson_by_run_id, format_json, format_per_thread_tables, format_table, load_latest_run,
    load_latest_runs_per_thread, load_ndjson, load_ndjson_per_thread, load_run, load_run_by_id,
    load_tagged_run, load_two_latest_runs, relative_time, resolve_tag, reverse_resolve_tag,
    save_tag,
};
use piano::resolve::{
    ResolveResult, ResolvedTarget, SkippedFunction, TargetSpec, module_prefix, qualify,
    resolve_targets,
};
#[derive(Parser)]
#[command(
    name = "piano",
    about = "Automated instrumentation-based profiling for Rust",
    version,
    after_help = "Workflow: piano profile [OPTIONS] (or: piano build, piano run, piano report)"
)]
struct Cli {
    #[command(subcommand)]
    command: Commands,
}

#[derive(Parser)]
struct BuildOpts {
    /// Instrument functions whose name contains PATTERN (repeatable).
    /// e.g. --fn parse matches parse, parse_line, MyStruct::try_parse.
    #[arg(long = "fn", value_name = "PATTERN")]
    fn_patterns: Vec<String>,

    /// Match --fn patterns exactly instead of by substring.
    #[arg(long, requires = "fn_patterns")]
    exact: bool,

    /// Instrument all functions in a file (repeatable).
    #[arg(long = "file", value_name = "PATH")]
    file_patterns: Vec<PathBuf>,

    /// Instrument all functions in a module (repeatable).
    #[arg(long = "mod", value_name = "NAME")]
    mod_patterns: Vec<String>,

    /// Exclude functions by name from the measurement set (repeatable).
    /// Two-phase precedence: selectors pick the inclusion set, --skip removes from it.
    #[arg(long = "skip", value_name = "FUNC")]
    skip_patterns: Vec<String>,

    /// Limit instrumentation to functions at call-graph depth N or less.
    /// Depth 0 = entry points only.
    #[arg(long, value_name = "N")]
    depth: Option<usize>,

    /// Project root (auto-detected from Cargo.toml).
    #[arg(long)]
    project: Option<PathBuf>,

    /// Path to piano-runtime source (for development before publishing).
    #[arg(long)]
    runtime_path: Option<PathBuf>,

    /// Build and profile a specific binary target (for projects with multiple
    /// [[bin]] entries). Matches cargo's --bin flag.
    #[arg(long, conflicts_with = "example")]
    bin: Option<String>,

    /// Build and profile an example target. Matches cargo's --example flag.
    #[arg(long, conflicts_with = "bin")]
    example: Option<String>,

    /// Capture per-thread CPU time alongside wall time (Unix only).
    #[arg(long)]
    cpu_time: bool,

    /// Directory for profiling output files.
    /// Overrides PIANO_RUNS_DIR env var and the default (target/piano/runs/).
    #[arg(long, value_name = "DIR")]
    output_dir: Option<PathBuf>,

    /// Show functions excluded from instrumentation and exit.
    #[arg(long)]
    list_skipped: bool,
}

#[derive(Subcommand)]
enum Commands {
    /// Instrument and build the project. Profiles all functions by default;
    /// use --fn, --file, or --mod to narrow scope.
    Build {
        #[command(flatten)]
        opts: BuildOpts,
    },
    /// Execute the last-built instrumented binary.
    /// Pass arguments to the binary after --.
    Run {
        /// Stop profiling after N seconds (sends SIGTERM to the binary).
        #[arg(long, value_name = "SECONDS", value_parser = parse_duration_secs)]
        duration: Option<f64>,

        /// Grace period before escalating SIGTERM to SIGKILL (seconds).
        /// Set to 0 to disable escalation. Default: 10.
        #[arg(long, value_name = "SECONDS", default_value = "10", value_parser = parse_kill_timeout)]
        kill_timeout: f64,

        /// Directory for profiling output files.
        /// Overrides PIANO_RUNS_DIR env var and the default (target/piano/runs/).
        #[arg(long, value_name = "DIR")]
        output_dir: Option<PathBuf>,

        /// Arguments to pass to the instrumented binary (after --).
        #[arg(last = true)]
        args: Vec<String>,
    },
    /// Build, execute, and report in one step.
    /// Pass arguments to the binary after --.
    Profile {
        #[command(flatten)]
        opts: BuildOpts,

        /// Show all functions, including those with zero calls (disables --top limit).
        #[arg(long, conflicts_with = "top")]
        all: bool,

        /// Show top N functions by self-time (default: 10).
        #[arg(long, value_name = "N", conflicts_with = "all")]
        top: Option<usize>,

        /// Output structured JSON instead of a table.
        #[arg(long)]
        json: bool,

        /// Show per-thread breakdown instead of aggregated view.
        #[arg(long)]
        threads: bool,

        /// Suppress warning when program exits with non-zero code.
        #[arg(long)]
        ignore_exit_code: bool,

        /// Stop profiling after N seconds (sends SIGTERM to the binary).
        #[arg(long, value_name = "SECONDS", value_parser = parse_duration_secs)]
        duration: Option<f64>,

        /// Grace period before escalating SIGTERM to SIGKILL (seconds).
        /// Set to 0 to disable escalation. Default: 10.
        #[arg(long, value_name = "SECONDS", default_value = "10", value_parser = parse_kill_timeout)]
        kill_timeout: f64,

        /// Arguments to pass to the instrumented binary (after --).
        #[arg(last = true)]
        args: Vec<String>,
    },
    /// Show the latest profiling run (or a specific one).
    Report {
        /// Path to a specific run file. If omitted, shows the latest.
        run: Option<PathBuf>,

        /// Show all functions, including those with zero calls (disables --top limit).
        #[arg(long, conflicts_with = "top")]
        all: bool,

        /// Show top N functions by self-time (default: 10).
        #[arg(long, value_name = "N", conflicts_with = "all")]
        top: Option<usize>,

        /// Output structured JSON instead of a table.
        #[arg(long)]
        json: bool,

        /// Show per-thread breakdown instead of aggregated view.
        #[arg(long)]
        threads: bool,

        /// Show measured times without subtracting profiling overhead.
        #[arg(long)]
        uncorrected: bool,

        /// Directory for profiling output files.
        /// Overrides PIANO_RUNS_DIR env var and the default (target/piano/runs/).
        #[arg(long, value_name = "DIR")]
        output_dir: Option<PathBuf>,
    },
    /// Compare two profiling runs.
    Diff {
        /// First run (path or tag; omit both to compare two most recent runs).
        a: Option<PathBuf>,
        /// Second run (path or tag).
        b: Option<PathBuf>,

        /// Show all functions, including those with zero calls (disables --top limit).
        #[arg(long, conflicts_with = "top")]
        all: bool,

        /// Show top N functions by self-time (default: 10).
        #[arg(long, value_name = "N", conflicts_with = "all")]
        top: Option<usize>,

        /// Output structured JSON instead of a table.
        #[arg(long)]
        json: bool,

        /// Directory for profiling output files.
        /// Overrides PIANO_RUNS_DIR env var and the default (target/piano/runs/).
        #[arg(long, value_name = "DIR")]
        output_dir: Option<PathBuf>,
    },
    /// Tag the latest run, or list existing tags (no args).
    Tag {
        /// Tag name. If omitted, lists all saved tags.
        name: Option<String>,

        /// Directory for profiling output files.
        /// Overrides PIANO_RUNS_DIR env var and the default (target/piano/runs/).
        #[arg(long, value_name = "DIR")]
        output_dir: Option<PathBuf>,
    },
}

fn parse_duration_secs(s: &str) -> Result<f64, String> {
    let secs: f64 = s
        .parse()
        .map_err(|e: std::num::ParseFloatError| e.to_string())?;
    if secs.is_nan() || secs.is_infinite() {
        return Err("invalid duration".to_string());
    }
    if secs < 0.0 {
        return Err("duration cannot be negative".to_string());
    }
    if secs == 0.0 {
        return Err("duration cannot be zero".to_string());
    }
    if secs > std::time::Duration::MAX.as_secs_f64() {
        return Err("duration is too large".to_string());
    }
    Ok(secs)
}

fn parse_kill_timeout(s: &str) -> Result<f64, String> {
    let secs: f64 = s
        .parse()
        .map_err(|e: std::num::ParseFloatError| e.to_string())?;
    if secs.is_nan() || secs.is_infinite() {
        return Err("invalid timeout".to_string());
    }
    if secs < 0.0 {
        return Err("timeout cannot be negative".to_string());
    }
    Ok(secs)
}

/// Default number of functions shown in report output.
const DEFAULT_TOP_N: usize = 10;

/// Resolve `--all` and `--top N` flags into `(show_all, limit, show_footer)`.
///
/// - `--all`: show everything, no limit, no footer.
/// - `--top N`: show top N, hide zero-call entries, no footer.
/// - Neither: show top DEFAULT_TOP_N, hide zero-call entries, show footer.
fn resolve_display_limit(all: bool, top: Option<usize>) -> (bool, Option<usize>, bool) {
    if all {
        (true, None, false)
    } else {
        (false, Some(top.unwrap_or(DEFAULT_TOP_N)), top.is_none())
    }
}

fn main() {
    // Wrapper mode: when invoked as RUSTC_WORKSPACE_WRAPPER, Cargo passes
    // the real rustc path as argv[1]. Detect via PIANO_WRAPPER_CONFIG env var.
    if let Ok(config_path) = std::env::var(piano::wrapper::CONFIG_ENV) {
        std::process::exit(piano::wrapper::run_wrapper(&config_path));
    }

    let cli = Cli::parse();
    if let Err(e) = run(cli) {
        eprintln!("error: {e}");
        process::exit(1);
    }
}

fn run(cli: Cli) -> Result<(), Error> {
    let project_root = find_project_root(&std::env::current_dir()?).ok();
    match cli.command {
        Commands::Build { opts } => cmd_build(opts, &project_root),
        Commands::Run {
            duration,
            kill_timeout,
            output_dir,
            args,
        } => cmd_run(duration, kill_timeout, output_dir, args, &project_root),
        Commands::Profile {
            opts,
            all,
            top,
            json,
            threads,
            ignore_exit_code,
            duration,
            kill_timeout,
            args,
        } => {
            let (show_all, limit, show_footer) = resolve_display_limit(all, top);
            cmd_profile(
                opts,
                &project_root,
                show_all,
                limit,
                show_footer,
                json,
                threads,
                ignore_exit_code,
                duration,
                kill_timeout,
                args,
            )
        }
        Commands::Report {
            run,
            all,
            top,
            json,
            threads,
            uncorrected,
            output_dir,
        } => {
            let (show_all, limit, show_footer) = resolve_display_limit(all, top);
            cmd_report(
                run,
                show_all,
                limit,
                show_footer,
                json,
                threads,
                uncorrected,
                &project_root,
                output_dir,
            )
        }
        Commands::Diff {
            a,
            b,
            all,
            top,
            json,
            output_dir,
        } => {
            let (show_all, limit, show_footer) = resolve_display_limit(all, top);
            cmd_diff(
                a,
                b,
                show_all,
                limit,
                show_footer,
                json,
                &project_root,
                output_dir,
            )
        }
        Commands::Tag { name, output_dir } => cmd_tag(name, &project_root, output_dir),
    }
}

/// Deduplicate and sort skip reasons into a comma-separated string.
fn unique_skip_reasons(skipped: &[SkippedFunction]) -> String {
    skipped
        .iter()
        .map(|s| s.reason.to_string())
        .collect::<std::collections::BTreeSet<_>>()
        .into_iter()
        .collect::<Vec<_>>()
        .join(", ")
}

/// Pre-assign name_ids for all qualified functions, excluding main().
///
/// main() is the lifecycle boundary -- it creates the root context, not a profiled
/// function, so it is excluded from the name table.
///
/// Returns (name_ids, display_names, next_available_id).
fn assign_name_ids(
    all_qualified: &[piano::naming::QualifiedFunction],
    display_names: &[String],
) -> (HashMap<String, u32>, HashMap<String, String>, u32) {
    let mut next_id: u32 = 0;
    let mut name_ids: HashMap<String, u32> = HashMap::new();
    let mut displays: HashMap<String, String> = HashMap::new();
    for (qf, display) in all_qualified.iter().zip(display_names.iter()) {
        if qf.minimal == "main" {
            continue;
        }
        name_ids.entry(qf.minimal.clone()).or_insert_with(|| {
            let id = next_id;
            next_id += 1;
            id
        });
        displays
            .entry(qf.minimal.clone())
            .or_insert_with(|| display.clone());
    }
    (name_ids, displays, next_id)
}

/// Build an instrumented binary and return (binary_path, runs_dir, instrumented_fn_count).
///
/// Returns `Ok(None)` when `--list-skipped` is used (early exit after printing).
/// Build an instrumented binary.
///
/// Pipeline:
///   1. Resolve project path, cargo metadata, binary target, source dir
///   2. Resolve target functions (selectors, --skip, --list-skipped early exit)
///   3. Qualify names, disambiguate, assign numeric IDs, discover macro functions
///   4. Pre-build piano-runtime, clean stale files, create runs dir
///   5. Compute workspace-relative paths, assemble WrapperConfig, write config
///   6. Build with RUSTC_WORKSPACE_WRAPPER, warn about concurrency
fn build_project(
    opts: BuildOpts,
    project_root: &Option<PathBuf>,
) -> Result<Option<(PathBuf, PathBuf, usize)>, Error> {
    let BuildOpts {
        fn_patterns,
        exact,
        file_patterns,
        mod_patterns,
        skip_patterns,
        depth,
        project,
        runtime_path,
        bin,
        example,
        cpu_time,
        output_dir,
        list_skipped,
    } = opts;

    if depth.is_some() {
        return Err(Error::BuildFailed(
            "--depth requires call-graph analysis which is not yet implemented".into(),
        ));
    }

    let project = match project {
        Some(p) => p,
        None => project_root.clone().ok_or_else(|| {
            Error::BuildFailed("could not find Cargo.toml in any parent directory".into())
        })?,
    };

    if !project.exists() {
        return Err(Error::BuildFailed(format!(
            "project directory does not exist: {}",
            project.display()
        )));
    }
    let project = std::fs::canonicalize(&project).map_err(io_context("canonicalize", &project))?;

    // Build target specs from CLI args.
    let mut specs: Vec<TargetSpec> = Vec::new();
    for p in fn_patterns {
        specs.push(TargetSpec::Fn(p));
    }
    for p in file_patterns {
        specs.push(TargetSpec::File(p));
    }
    for m in mod_patterns {
        specs.push(TargetSpec::Mod(m));
    }

    // Use cargo metadata for project discovery.
    let metadata = cargo_metadata(&project)?;
    let workspace_root = metadata.workspace_root.canonicalize().map_err(|e| {
        Error::BuildFailed(format!(
            "failed to canonicalize workspace root {}: {e}",
            metadata.workspace_root.display()
        ))
    })?;

    // Find the target package and binary/example.
    let target_kind = if example.is_some() { "example" } else { "bin" };
    let target_name = example.as_deref().or(bin.as_deref());
    let (package_name, bin_src_path) = if target_name.is_some() || metadata.packages.len() == 1 {
        let pkg_filter = if metadata.packages.len() == 1 {
            None
        } else {
            find_current_package(&metadata, &project).map(|p| p.name.as_str())
        };
        find_target(&metadata, pkg_filter, target_name, target_kind)?
    } else {
        // Multiple packages, no --bin/--example: find the package matching project dir.
        let pkg = find_current_package(&metadata, &project).ok_or_else(|| {
            Error::BuildFailed(format!(
                "could not determine which package to build in workspace at {}",
                workspace_root.display()
            ))
        })?;
        find_target(&metadata, Some(&pkg.name), None, "bin")?
    };

    // Derive source directory from the binary's src_path.
    // The src_path points to the entry point (e.g., /ws/crates/core/src/main.rs).
    // The package's source root is the parent of "src/" in the path, or the
    // manifest_path parent.
    let pkg = metadata
        .packages
        .iter()
        .find(|p| p.name == package_name)
        .expect("package must exist: find_bin_target returned it");
    let pkg_root = pkg
        .manifest_path
        .parent()
        .ok_or_else(|| Error::BuildFailed("package manifest has no parent directory".into()))?;
    let pkg_root = pkg_root.canonicalize().map_err(|e| {
        Error::BuildFailed(format!(
            "failed to canonicalize package root {}: {e}",
            pkg_root.display()
        ))
    })?;

    // Determine the source directory. Use src/ if it exists, otherwise use the
    // parent of the binary's src_path relative to the package root.
    let src_dir = if pkg_root.join("src").is_dir() {
        pkg_root.join("src")
    } else {
        // Derive from binary src_path: strip pkg_root prefix, take first component.
        let bin_rel = bin_src_path
            .canonicalize()
            .unwrap_or_else(|_| bin_src_path.clone());
        bin_rel.parent().unwrap_or(&pkg_root).to_path_buf()
    };

    let ResolveResult {
        targets,
        skipped,
        all_functions,
    } = resolve_targets(&src_dir, &specs, exact)?;

    // Apply --skip: remove functions matching skip patterns from the measured set.
    // Two-phase precedence: selectors pick the inclusion set, --skip removes from it.
    let targets: Vec<ResolvedTarget> = if skip_patterns.is_empty() {
        targets
    } else {
        targets
            .into_iter()
            .filter_map(|mut t| {
                t.functions.retain(|qf| {
                    let bare = qf.minimal.rsplit("::").next().unwrap_or(&qf.minimal);
                    !skip_patterns
                        .iter()
                        .any(|skip| bare == skip.as_str() || qf.minimal == *skip)
                });
                if t.functions.is_empty() {
                    None
                } else {
                    Some(t)
                }
            })
            .collect()
    };

    if list_skipped {
        if skipped.is_empty() {
            eprintln!("no functions skipped");
        } else {
            for s in &skipped {
                println!("{}: {} ({})", s.path.display(), s.name, s.reason);
            }
        }
        return Ok(None);
    }

    if !specs.is_empty() && !skipped.is_empty() {
        eprintln!(
            "warning: {} function(s) skipped ({}) -- run piano build --list-skipped to see which",
            skipped.len(),
            unique_skip_reasons(&skipped)
        );
    }

    let total_fns: usize = targets.iter().map(|t| t.functions.len()).sum();
    eprintln!(
        "found {} function(s) across {} file(s)",
        total_fns,
        targets.len()
    );
    const INSTRUMENT_ALL_WARN_THRESHOLD: usize = 200;
    if specs.is_empty() && total_fns > INSTRUMENT_ALL_WARN_THRESHOLD {
        eprintln!(
            "warning: instrumenting {total_fns} functions may add overhead. \
             Use --fn, --file, or --mod to narrow scope"
        );
    }
    for target in &targets {
        let relative = target.file.strip_prefix(&src_dir).unwrap_or(&target.file);
        eprintln!("  {}:", relative.display());
        for qf in &target.functions {
            eprintln!("    {}", qf.minimal);
        }
    }

    let member_subdir = if pkg_root != workspace_root {
        Some(
            pkg_root
                .strip_prefix(&workspace_root)
                .map_err(|e| std::io::Error::other(e.to_string()))?
                .to_path_buf(),
        )
    } else {
        None
    };

    let src_rel = src_dir.strip_prefix(&pkg_root).unwrap_or(Path::new("src"));

    // Collect all QualifiedFunction entries with module prefixes applied,
    // then run progressive disambiguation to compute display names.
    let mut all_qualified: Vec<piano::naming::QualifiedFunction> = Vec::new();
    for target in &targets {
        let prefix = module_prefix(target.file.strip_prefix(&src_dir).unwrap_or(&target.file));
        for qf in &target.functions {
            all_qualified.push(piano::naming::QualifiedFunction::new(
                &qualify(&prefix, &qf.minimal),
                &qualify(&prefix, &qf.medium),
                &qualify(&prefix, &qf.full),
            ));
        }
    }
    let display_names = piano::naming::disambiguate(&all_qualified);

    let (global_name_ids, global_display_names, _next_id) =
        assign_name_ids(&all_qualified, &display_names);

    // TODO(rewriter-rebuild): macro function name discovery will be
    // reimplemented as part of the new guard-only rewriter.

    // Build set of all instrumentable function names across the entire workspace.
    // Uses all_functions (not just measured targets) so that non-measured functions
    // Build a set of measured function names (from targets) for quick lookup.
    let measured_names: HashSet<String> = targets
        .iter()
        .flat_map(|t| {
            let prefix = module_prefix(t.file.strip_prefix(&src_dir).unwrap_or(&t.file));
            t.functions
                .iter()
                .map(move |qf| qualify(&prefix, &qf.minimal))
        })
        .collect();

    // Pre-build piano-runtime with the user's toolchain.
    let target_dir = project.join("target").join("piano");
    eprintln!("pre-building piano-runtime...");
    let runtime = match runtime_path {
        Some(ref path) => {
            let abs_path = std::fs::canonicalize(path).map_err(io_context("canonicalize", path))?;
            prebuild_runtime_from_path(&abs_path, &project, &target_dir, &[])?
        }
        None => prebuild_runtime(&project, &target_dir, &[])?,
    };

    // Clean stale temp files from previous crashed runs.
    clean_stale_piano_files(&src_dir)?;
    piano::staging::clean_stale_staging(&target_dir);

    let runs_dir = match &output_dir {
        Some(dir) => dir.clone(),
        None => target_dir.join("runs"),
    };
    std::fs::create_dir_all(&runs_dir).map_err(io_context("create directory", &runs_dir))?;

    // Compute source paths relative to workspace root (matches what wrapper receives).
    let mut targets_relative: HashMap<PathBuf, HashMap<String, u32>> = HashMap::new();

    for af in &all_functions {
        let relative = af.file.strip_prefix(&src_dir).unwrap_or(&af.file);
        let prefix = module_prefix(relative);
        let measured: HashMap<String, u32> = af
            .functions
            .iter()
            .filter_map(|qf| {
                let qualified = qualify(&prefix, &qf.minimal);
                if measured_names.contains(&qualified) {
                    global_name_ids
                        .get(&qualified)
                        .map(|&id| (qf.minimal.clone(), id))
                } else {
                    None
                }
            })
            .collect();

        let ws_relative = if let Some(ref sub) = member_subdir {
            PathBuf::from(sub).join(src_rel).join(relative)
        } else {
            PathBuf::from(src_rel).join(relative)
        };

        targets_relative.insert(ws_relative, measured);
    }

    // Entry point path relative to workspace root
    let bin_src_canonical = bin_src_path.canonicalize().map_err(|e| {
        Error::BuildFailed(format!(
            "failed to canonicalize binary source path {}: {e}",
            bin_src_path.display()
        ))
    })?;
    let bin_entry_relative = bin_src_canonical
        .strip_prefix(&workspace_root)
        .map_err(|_| {
            Error::BuildFailed(format!(
                "binary source {} is outside workspace root {}",
                bin_src_canonical.display(),
                workspace_root.display()
            ))
        })?
        .to_path_buf();

    // Build the (id, display_name) name table sorted by id.
    let mut name_table: Vec<(u32, String)> = global_name_ids
        .iter()
        .map(|(qualified, &id)| {
            let display = global_display_names
                .get(qualified)
                .cloned()
                .unwrap_or_else(|| qualified.clone());
            (id, display)
        })
        .collect();
    name_table.sort_by_key(|(id, _)| *id);

    // Collect files that the wrapper will modify (for error remapping)
    let mut modified_files: std::collections::HashSet<std::path::PathBuf> =
        targets_relative.keys().cloned().collect();
    modified_files.insert(bin_entry_relative.clone());

    // Write wrapper config
    let config = piano::wrapper::WrapperConfig {
        runtime_rlib: runtime.rlib_path,
        runtime_deps_dir: runtime.deps_dir,
        entry_point: piano::wrapper::EntryPointConfig {
            source_path: bin_entry_relative,
            name_table,
            runs_dir: runs_dir.clone(),
            cpu_time,
        },
        targets: targets_relative,
    };

    let config_path = target_dir.join("config.json");
    let config_json = serde_json::to_string(&config)
        .map_err(|e| Error::BuildFailed(format!("failed to serialize wrapper config: {e}")))?;
    std::fs::write(&config_path, config_json)
        .map_err(io_context("write wrapper config", &config_path))?;

    // Build with wrapper
    let pkg_arg = if member_subdir.is_some() {
        Some(package_name.as_str())
    } else {
        None
    };
    let cargo_target = if let Some(ref ex) = example {
        Some(CargoTarget::Example(ex.as_str()))
    } else {
        bin.as_deref().map(CargoTarget::Bin)
    };
    let binary = build_instrumented(
        &workspace_root,
        &target_dir,
        pkg_arg,
        cargo_target,
        &config_path,
        &modified_files,
    )?;

    Ok(Some((binary, runs_dir, total_fns)))
}

fn cmd_build(opts: BuildOpts, project_root: &Option<PathBuf>) -> Result<(), Error> {
    let Some((binary, _runs_dir, _total_fns)) = build_project(opts, project_root)? else {
        return Ok(());
    };
    let display_name = binary
        .file_name()
        .map(|n| n.to_string_lossy().into_owned())
        .unwrap_or_else(|| binary.display().to_string());
    eprintln!("built: {display_name}");
    if !std::io::stdout().is_terminal() {
        println!("{}", binary.display());
    }

    Ok(())
}

/// Returns true if the given file extension belongs to a binary executable.
/// On Windows, `.exe` is a binary extension. On Unix, binaries have no extension
/// so this always returns false.
fn is_binary_extension(ext: &std::ffi::OsStr) -> bool {
    cfg!(windows) && ext == "exe"
}

fn find_latest_binary(project_root: &Option<PathBuf>) -> Result<PathBuf, Error> {
    let project = project_root.as_ref().ok_or(Error::NoBinary)?;
    let release_dir = project.join("target/piano/release");
    if !release_dir.is_dir() {
        return Err(Error::NoBinary);
    }
    let mut dirs = vec![release_dir.clone()];
    let examples_dir = release_dir.join("examples");
    if examples_dir.is_dir() {
        dirs.push(examples_dir);
    }
    let mut best: Option<(PathBuf, std::time::SystemTime)> = None;
    for dir in &dirs {
        let entries = std::fs::read_dir(dir).map_err(io_context("read directory", dir))?;
        for entry in entries {
            let entry = entry.map_err(io_context("read directory entry", dir))?;
            let path = entry.path();
            if !path.is_file() {
                continue;
            }
            if let Some(ext) = path.extension() {
                if !is_binary_extension(ext) {
                    continue;
                }
            }
            let meta = entry
                .metadata()
                .map_err(io_context("read metadata", &path))?;
            #[cfg(unix)]
            {
                use std::os::unix::fs::PermissionsExt;
                if meta.permissions().mode() & 0o111 == 0 {
                    continue;
                }
            }
            let mtime = meta
                .modified()
                .map_err(io_context("read modified time", &path))?;
            if best.as_ref().is_none_or(|(_, t)| mtime > *t) {
                best = Some((path, mtime));
            }
        }
    }
    best.map(|(p, _)| p).ok_or(Error::NoBinary)
}

/// Why the child process stopped.
enum StopReason {
    /// Child exited on its own (normal exit or crash).
    Normal,
    /// The `--duration` timeout expired; SIGTERM sent to child.
    Duration,
    /// User pressed Ctrl-C; SIGTERM forwarded to child.
    Interrupted,
    /// Child did not respond to SIGTERM within kill-timeout; escalated to SIGKILL.
    ForceKilled,
}

/// Result of running a child process, including why it stopped.
struct ChildOutcome {
    status: process::ExitStatus,
    stop_reason: StopReason,
}

/// Single global: set-once flag for Ctrl-C. One writer (signal handler),
/// one reader (polling loop). No PID, no cross-thread coordination.
static INTERRUPTED: AtomicBool = AtomicBool::new(false);

/// Terminate a child process (SIGTERM on Unix, TerminateProcess on Windows).
fn terminate_child(child: &process::Child) {
    #[cfg(unix)]
    // SAFETY: child.id() returns the PID from spawn. The child has not been
    // reaped by this process. Sending SIGTERM to a zombie is harmless (returns ESRCH).
    unsafe {
        libc::kill(child.id() as libc::pid_t, libc::SIGTERM);
    }

    #[cfg(windows)]
    // Note: TerminateProcess is an immediate kill (no graceful shutdown on Windows).
    // SAFETY: OpenProcess/TerminateProcess/CloseHandle with a valid PID from
    // Child::id(). Handle closed immediately after use.
    unsafe {
        extern "system" {
            fn OpenProcess(access: u32, inherit: i32, pid: u32) -> *mut std::ffi::c_void;
            fn TerminateProcess(handle: *mut std::ffi::c_void, exit_code: u32) -> i32;
            fn CloseHandle(handle: *mut std::ffi::c_void) -> i32;
        }
        const PROCESS_TERMINATE: u32 = 0x0001;
        let handle = OpenProcess(PROCESS_TERMINATE, 0, child.id());
        if !handle.is_null() {
            TerminateProcess(handle, 1);
            CloseHandle(handle);
        }
    }
}

/// Wait for a child to exit, escalating to SIGKILL after a grace period.
///
/// Polls try_wait in a loop. If the child doesn't exit within `grace`,
/// sends SIGKILL via Child::kill() and waits for exit.
fn wait_or_kill(
    child: &mut process::Child,
    grace: Duration,
    binary: &Path,
) -> Result<(process::ExitStatus, bool), Error> {
    if grace == Duration::ZERO {
        let status = child.wait().map_err(|e| {
            Error::RunFailed(format!("failed to wait for {}: {e}", binary.display()))
        })?;
        return Ok((status, false));
    }
    let start = std::time::Instant::now();
    loop {
        match child.try_wait() {
            Ok(Some(status)) => return Ok((status, false)),
            Ok(None) => {
                if start.elapsed() >= grace {
                    let _ = child.kill();
                    let status = child.wait().map_err(|e| {
                        Error::RunFailed(format!("failed to wait for {}: {e}", binary.display()))
                    })?;
                    return Ok((status, true));
                }
                std::thread::sleep(Duration::from_millis(10));
            }
            Err(e) => {
                return Err(Error::RunFailed(format!(
                    "failed to wait for {}: {e}",
                    binary.display()
                )));
            }
        }
    }
}

/// Spawn a child process, optionally killing it after a timeout.
///
/// Single-threaded polling loop. No background threads, no global PID.
/// The child is in the parent's process group, so terminal Ctrl-C delivers
/// SIGINT to both parent and child. For programmatic kill(pid, SIGINT),
/// only the parent receives it; the loop forwards SIGTERM to the child.
///
/// The only global state is INTERRUPTED (AtomicBool), set once by the
/// SIGINT handler so the parent survives Ctrl-C and collects the child's
/// exit status before reporting.
fn run_child(
    binary: &Path,
    args: &[String],
    timeout: Option<Duration>,
    kill_timeout: Duration,
    suppress_stdout: bool,
    env: &[(&str, &str)],
) -> Result<ChildOutcome, Error> {
    INTERRUPTED.store(false, Ordering::SeqCst);

    #[cfg(unix)]
    {
        extern "C" fn sigint_handler(_sig: i32) {
            INTERRUPTED.store(true, Ordering::SeqCst);
        }

        // SAFETY: sigaction with a valid handler function pointer.
        unsafe {
            let mut act: libc::sigaction = std::mem::zeroed();
            act.sa_sigaction = sigint_handler as *const () as usize;
            act.sa_flags = libc::SA_RESETHAND;
            libc::sigaction(libc::SIGINT, &act, std::ptr::null_mut());
        }
    }

    let mut cmd = process::Command::new(binary);
    cmd.args(args);
    for &(key, val) in env {
        cmd.env(key, val);
    }
    if suppress_stdout {
        cmd.stdout(process::Stdio::null());
    }

    let mut child = cmd
        .spawn()
        .map_err(|e| Error::RunFailed(format!("failed to run {}: {e}", binary.display())))?;

    if let Some(dur) = timeout {
        eprintln!("will stop after {}s", dur.as_secs_f64());
    }

    let start = std::time::Instant::now();
    let poll_interval = Duration::from_millis(10);
    let mut sigterm_sent_at: Option<std::time::Instant> = None;

    let outcome = loop {
        // 1. Check if child exited.
        match child.try_wait() {
            Ok(Some(status)) => {
                // Duration takes precedence over Interrupted when both are true
                // because the duration timeout was the root cause (it fired first).
                let stop_reason = if sigterm_sent_at.is_some() {
                    StopReason::Duration
                } else if INTERRUPTED.load(Ordering::SeqCst) {
                    StopReason::Interrupted
                } else {
                    StopReason::Normal
                };
                break ChildOutcome {
                    status,
                    stop_reason,
                };
            }
            Ok(None) => {}
            Err(e) => {
                return Err(Error::RunFailed(format!(
                    "failed to wait for {}: {e}",
                    binary.display()
                )));
            }
        }

        // 2. Duration timeout: send SIGTERM.
        if let Some(dur) = timeout {
            if sigterm_sent_at.is_none() && start.elapsed() >= dur {
                terminate_child(&child);
                sigterm_sent_at = Some(std::time::Instant::now());
            }
        }

        // 3. Ctrl-C: forward SIGTERM to child (terminal Ctrl-C sends to
        // process group, but programmatic kill(pid, SIGINT) only hits us).
        // Then wait for graceful exit, escalate to SIGKILL after kill_timeout.
        if INTERRUPTED.load(Ordering::SeqCst) {
            terminate_child(&child);
            let (status, force_killed) = wait_or_kill(&mut child, kill_timeout, binary)?;
            break ChildOutcome {
                status,
                stop_reason: if force_killed {
                    StopReason::ForceKilled
                } else {
                    StopReason::Interrupted
                },
            };
        }

        // 4. SIGKILL escalation after duration SIGTERM.
        if let Some(sent_at) = sigterm_sent_at {
            if kill_timeout > Duration::ZERO && sent_at.elapsed() >= kill_timeout {
                let _ = child.kill();
                let status = child.wait().map_err(|e| {
                    Error::RunFailed(format!("failed to wait for {}: {e}", binary.display()))
                })?;
                break ChildOutcome {
                    status,
                    stop_reason: StopReason::ForceKilled,
                };
            }
        }

        std::thread::sleep(poll_interval);
    };

    // Restore default SIGINT handler.
    #[cfg(unix)]
    // SAFETY: restoring SIG_DFL for SIGINT via sigaction.
    unsafe {
        let mut act: libc::sigaction = std::mem::zeroed();
        act.sa_sigaction = libc::SIG_DFL;
        libc::sigaction(libc::SIGINT, &act, std::ptr::null_mut());
    }

    Ok(outcome)
}

fn cmd_run(
    duration: Option<f64>,
    kill_timeout: f64,
    output_dir: Option<PathBuf>,
    args: Vec<String>,
    project_root: &Option<PathBuf>,
) -> Result<(), Error> {
    let binary = find_latest_binary(project_root)?;
    eprintln!("running: {}", binary.display());
    eprintln!("--- program output ---");

    // When --output-dir is provided, override the runs directory via env var
    // so the instrumented binary writes output there.
    let output_dir_str = output_dir
        .as_ref()
        .map(|d| d.to_string_lossy().into_owned());
    let env: Vec<(&str, &str)> = match &output_dir_str {
        Some(dir) => vec![("PIANO_RUNS_DIR", dir.as_str())],
        None => vec![],
    };

    let timeout = duration.map(Duration::from_secs_f64);
    let kill_dur = Duration::from_secs_f64(kill_timeout);
    let outcome = run_child(&binary, &args, timeout, kill_dur, false, &env)?;

    if matches!(outcome.stop_reason, StopReason::ForceKilled) {
        eprintln!("warning: program did not respond to SIGTERM -- terminated after --kill-timeout");
    }

    match outcome.stop_reason {
        StopReason::Duration | StopReason::ForceKilled => std::process::exit(0),
        StopReason::Interrupted => std::process::exit(130),
        StopReason::Normal => std::process::exit(outcome.status.code().unwrap_or(1)),
    }
}

#[allow(clippy::too_many_arguments)]
fn cmd_profile(
    opts: BuildOpts,
    project_root: &Option<PathBuf>,
    show_all: bool,
    limit: Option<usize>,
    show_footer: bool,
    json: bool,
    threads: bool,
    ignore_exit_code: bool,
    duration: Option<f64>,
    kill_timeout: f64,
    args: Vec<String>,
) -> Result<(), Error> {
    let Some((binary, runs_dir, total_fns)) = build_project(opts, project_root)? else {
        return Ok(());
    };
    let display_name = binary
        .file_name()
        .map(|n| n.to_string_lossy().into_owned())
        .unwrap_or_else(|| binary.display().to_string());
    eprintln!("built: {display_name}");
    eprintln!("--- program output ---");

    let profile_start_ms = std::time::SystemTime::now()
        .duration_since(std::time::UNIX_EPOCH)
        .unwrap_or_default()
        .as_millis();

    let child_env: Vec<(&str, &str)> = vec![];

    let timeout = duration.map(Duration::from_secs_f64);
    let kill_dur = Duration::from_secs_f64(kill_timeout);
    let outcome = run_child(&binary, &args, timeout, kill_dur, json, &child_env)?;
    let intentional_stop = matches!(
        outcome.stop_reason,
        StopReason::Duration | StopReason::Interrupted | StopReason::ForceKilled
    );

    if matches!(outcome.stop_reason, StopReason::ForceKilled) {
        eprintln!("warning: program did not respond to SIGTERM -- terminated after --kill-timeout");
    }

    if !outcome.status.success() && !ignore_exit_code && !intentional_stop {
        if let Some(code) = outcome.status.code() {
            eprintln!(
                "warning: program exited with code {code}; profiling results may be incomplete"
            );
        } else {
            eprintln!("warning: program terminated by signal; profiling results may be incomplete");
        }
    }

    // Point cmd_report at the project's runs directory so it works even when
    // CWD differs from the --project path. Skip if already set: the user
    // or test harness may have overridden it, and the runtime's shutdown_to()
    // respects PIANO_RUNS_DIR too.
    if std::env::var_os("PIANO_RUNS_DIR").is_none() {
        // SAFETY: single-threaded CLI at this point, no concurrent env reads.
        unsafe { std::env::set_var("PIANO_RUNS_DIR", &runs_dir) };
    }

    // Guard against stale data: if no run file was written during THIS run,
    // don't let cmd_report pick up a file from a previous run.
    let effective_runs_dir = default_runs_dir(project_root)?;
    if find_latest_run_file_since(&effective_runs_dir, profile_start_ms)?.is_none() {
        if !outcome.status.success() && !ignore_exit_code && !intentional_stop {
            // Program failed, no data -- suppress (UX principle 6).
            return Ok(());
        }
        if total_fns == 0 {
            return Err(Error::NoFunctionsInstrumented);
        }
        return Err(Error::NoDataWritten(effective_runs_dir));
    }

    eprintln!("--- profiling report ---");
    let report_result = match cmd_report(
        None,
        show_all,
        limit,
        show_footer,
        json,
        threads,
        false,
        project_root,
        None,
    ) {
        Ok(()) => Ok(()),
        Err(Error::NoRuns)
            if !outcome.status.success() && !ignore_exit_code && !intentional_stop =>
        {
            // Program failed and produced no data. The program's own error
            // output is the primary affordance (UX principle 6). Suppress
            // Piano's NoRuns to avoid cascading errors.
            //
            // When --ignore-exit-code is set, the user explicitly asked to
            // continue despite non-zero exit -- NoRuns should surface as
            // NoDataWritten so they know profiling failed.
            Ok(())
        }
        Err(Error::NoRuns) if total_fns == 0 => {
            // No functions were instrumented -- the binary ran but had
            // nothing to record.
            Err(Error::NoFunctionsInstrumented)
        }
        Err(Error::NoRuns) => {
            // Functions were instrumented but no data was written.
            // Something went wrong with the runtime's write -- give an
            // actionable message.
            Err(Error::NoDataWritten(runs_dir))
        }
        Err(e) => Err(e),
    };

    report_result?;

    if !outcome.status.success() && !ignore_exit_code && !intentional_stop {
        std::process::exit(outcome.status.code().unwrap_or(1));
    }

    Ok(())
}

#[allow(clippy::too_many_arguments)]
fn cmd_report(
    run_path: Option<PathBuf>,
    show_all: bool,
    limit: Option<usize>,
    show_footer: bool,
    json: bool,
    threads: bool,
    uncorrected: bool,
    project_root: &Option<PathBuf>,
    output_dir: Option<PathBuf>,
) -> Result<(), Error> {
    // When --output-dir is provided, set the env var so default_runs_dir picks it up.
    if let Some(ref dir) = output_dir {
        // SAFETY: single-threaded CLI -- no concurrent env reads.
        unsafe { std::env::set_var("PIANO_RUNS_DIR", dir) };
    }
    // Resolve the run file path.
    let resolved_path = match &run_path {
        Some(p) if p.exists() => Some(p.clone()),
        Some(p) => {
            // Tag lookup: resolve to NDJSON file if available.
            let tag = p.to_string_lossy();
            let tags_dir = default_tags_dir(project_root)?;
            let runs_dir = default_runs_dir(project_root)?;
            let run_id = resolve_tag(&tags_dir, &tag)?;
            match find_ndjson_by_run_id(&runs_dir, &run_id)? {
                Some(ndjson_path) => Some(ndjson_path),
                None => {
                    // No NDJSON file found; fall back to basic JSON table.
                    let run = load_run_by_id(&runs_dir, &run_id).map_err(|e| match e {
                        Error::NoRuns => Error::RunNotFound {
                            tag: tag.to_string(),
                        },
                        other => other,
                    })?;
                    if json {
                        println!("{}", format_json(&run, show_all, limit));
                    } else {
                        anstream::print!("{}", format_table(&run, show_all, limit, show_footer));
                    }
                    return Ok(());
                }
            }
        }
        None => {
            // Find the latest run file.
            let dir = default_runs_dir(project_root)?;
            find_latest_run_file(&dir)?
        }
    };

    // If we have a .ndjson file, load and display using Run-based formatters.
    if let Some(path) = &resolved_path
        && path.extension().and_then(|e| e.to_str()) == Some("ndjson")
    {
        if threads {
            let thread_runs = load_ndjson_per_thread(path, uncorrected)?;
            match thread_runs {
                Some(runs) => {
                    if json {
                        // Per-thread JSON: serialize each thread's Run as a JSON array.
                        let entries: Vec<_> = runs
                            .iter()
                            .enumerate()
                            .map(|(i, run)| {
                                serde_json::json!({
                                    "thread": i + 1,
                                    "functions": serde_json::from_str::<serde_json::Value>(
                                        &format_json(run, show_all, limit)
                                    ).unwrap_or_default()
                                })
                            })
                            .collect();
                        println!(
                            "{}",
                            serde_json::to_string_pretty(&entries)
                                .expect("JSON serialization should not fail")
                        );
                    } else {
                        anstream::print!(
                            "{}",
                            format_per_thread_tables(&runs, show_all, limit, show_footer)
                        );
                    }
                }
                None => {
                    eprintln!(
                        "warning: --threads requires per-thread data; this file predates thread tracking"
                    );
                    eprintln!("warning: showing aggregated view instead");
                    let (run, _completeness) = load_ndjson(path, uncorrected)?;
                    if json {
                        println!("{}", format_json(&run, show_all, limit));
                    } else {
                        anstream::print!("{}", format_table(&run, show_all, limit, show_footer));
                    }
                }
            }
        } else {
            let (run, _completeness) = load_ndjson(path, uncorrected)?;
            if json {
                println!("{}", format_json(&run, show_all, limit));
            } else {
                anstream::print!("{}", format_table(&run, show_all, limit, show_footer));
            }
        }
        return Ok(());
    }

    // Per-thread mode: load individual thread files without merging.
    if threads {
        let dir = default_runs_dir(project_root)?;
        let thread_runs = load_latest_runs_per_thread(&dir)?;
        anstream::print!(
            "{}",
            format_per_thread_tables(&thread_runs, show_all, limit, show_footer)
        );
        return Ok(());
    }

    // Fall back to JSON table.
    let run = match resolved_path {
        Some(p) => load_run(&p)?,
        None => {
            let dir = default_runs_dir(project_root)?;
            load_latest_run(&dir)?
        }
    };
    if json {
        println!("{}", format_json(&run, show_all, limit));
    } else {
        anstream::print!("{}", format_table(&run, show_all, limit, show_footer));
    }
    Ok(())
}

/// Derive a display label from a diff argument.
///
/// Tag names pass through as-is; file paths use the filename stem.
fn diff_label(arg: &Path) -> String {
    if arg.exists() {
        arg.file_stem()
            .map(|s| s.to_string_lossy().into_owned())
            .unwrap_or_else(|| arg.to_string_lossy().into_owned())
    } else {
        arg.to_string_lossy().into_owned()
    }
}

#[allow(clippy::too_many_arguments)]
fn cmd_diff(
    a: Option<PathBuf>,
    b: Option<PathBuf>,
    show_all: bool,
    limit: Option<usize>,
    _show_footer: bool,
    json: bool,
    project_root: &Option<PathBuf>,
    output_dir: Option<PathBuf>,
) -> Result<(), Error> {
    // When --output-dir is provided, set the env var so default_runs_dir picks it up.
    if let Some(ref dir) = output_dir {
        // SAFETY: single-threaded CLI -- no concurrent env reads.
        unsafe { std::env::set_var("PIANO_RUNS_DIR", dir) };
    }
    match (a, b) {
        (Some(a), Some(b)) => {
            let label_a = diff_label(&a);
            let label_b = diff_label(&b);
            let run_a = resolve_run_arg(&a, project_root)?;
            let run_b = resolve_run_arg(&b, project_root)?;
            if json {
                println!("{}", diff_runs_json(&run_a, &run_b, show_all, limit));
            } else {
                anstream::print!(
                    "{}",
                    diff_runs(&run_a, &run_b, &label_a, &label_b, show_all, limit)
                );
            }
        }
        (None, None) => {
            let runs_dir = default_runs_dir(project_root)?;
            let tags_dir = default_tags_dir(project_root).ok();
            let (previous, latest) = load_two_latest_runs(&runs_dir)?;

            if json {
                println!("{}", diff_runs_json(&previous, &latest, show_all, limit));
            } else {
                let label_a = resolve_diff_label(&tags_dir, &previous, &runs_dir, "previous");
                let label_b = resolve_diff_label(&tags_dir, &latest, &runs_dir, "latest");
                eprintln!("comparing: {label_a} vs {label_b}");
                anstream::print!(
                    "{}",
                    diff_runs(&previous, &latest, &label_a, &label_b, show_all, limit)
                );
            }
        }
        _ => {
            return Err(Error::DiffArgCount);
        }
    }
    Ok(())
}

/// Determine a display label for an auto-selected diff run.
///
/// Uses the tag name if a tag points to this run, otherwise falls back
/// to a relative timestamp with a role prefix ("previous (2 min ago)").
fn resolve_diff_label(
    tags_dir: &Option<PathBuf>,
    run: &piano::report::Run,
    runs_dir: &Path,
    role: &str,
) -> String {
    // Try reverse-resolving a tag.
    if let (Some(tags), Some(run_id)) = (tags_dir, &run.run_id) {
        if let Some(tag) = reverse_resolve_tag(tags, run_id) {
            return tag;
        }
    }

    // Fall back to relative timestamp from file modified time.
    let stem = run.timestamp_ms.to_string();
    for ext in &["ndjson", "json"] {
        let path = runs_dir.join(format!("{stem}.{ext}"));
        if let Ok(meta) = std::fs::metadata(&path) {
            if let Ok(modified) = meta.modified() {
                let rel = relative_time(modified);
                return format!("{role} ({rel})");
            }
        }
    }

    // Last resort: use the raw timestamp with role prefix.
    format!("{role} ({stem})")
}

fn cmd_tag(
    name: Option<String>,
    project_root: &Option<PathBuf>,
    output_dir: Option<PathBuf>,
) -> Result<(), Error> {
    // When --output-dir is provided, set the env var so default_runs_dir picks it up.
    if let Some(ref dir) = output_dir {
        // SAFETY: single-threaded CLI -- no concurrent env reads.
        unsafe { std::env::set_var("PIANO_RUNS_DIR", dir) };
    }
    let Some(name) = name else {
        let tags_dir = match default_tags_dir(project_root) {
            Ok(dir) => dir,
            Err(Error::NoRuns) => {
                eprintln!("no tags saved");
                return Ok(());
            }
            Err(e) => return Err(e),
        };
        let mut entries: Vec<String> = std::fs::read_dir(&tags_dir)
            .map_err(|source| Error::TagReadError {
                path: tags_dir.clone(),
                source,
            })?
            .filter_map(|entry| {
                let entry = entry.ok()?;
                if entry.file_type().ok()?.is_file() {
                    Some(entry.file_name().to_string_lossy().into_owned())
                } else {
                    None
                }
            })
            .collect();
        if entries.is_empty() {
            eprintln!("no tags saved");
            return Ok(());
        }
        entries.sort();
        for tag in &entries {
            println!("{tag}");
        }
        return Ok(());
    };

    let runs_dir = default_runs_dir(project_root)?;
    let tags_dir = default_tags_dir(project_root)?;
    let latest = load_latest_run(&runs_dir)?;
    let run_id = latest.run_id.ok_or(Error::NoRuns)?;
    save_tag(&tags_dir, &name, &run_id)?;
    eprintln!("tagged '{name}'");
    Ok(())
}

fn resolve_run_arg(
    arg: &Path,
    project_root: &Option<PathBuf>,
) -> Result<piano::report::Run, Error> {
    if arg.exists() {
        return load_run(arg);
    }
    let tag = arg.to_string_lossy();
    let tags_dir = default_tags_dir(project_root)?;
    let runs_dir = default_runs_dir(project_root)?;
    load_tagged_run(&tags_dir, &runs_dir, &tag)
}

fn default_runs_dir(project_root: &Option<PathBuf>) -> Result<PathBuf, Error> {
    if let Ok(dir) = std::env::var("PIANO_RUNS_DIR") {
        return Ok(PathBuf::from(dir));
    }
    let project = project_root.as_ref().ok_or(Error::NoRuns)?;
    let local = project.join("target/piano/runs");
    if local.is_dir() {
        return Ok(local);
    }
    Err(Error::NoRuns)
}

fn default_tags_dir(project_root: &Option<PathBuf>) -> Result<PathBuf, Error> {
    let project = project_root.as_ref().ok_or(Error::NoRuns)?;
    let local = project.join("target/piano/tags");
    if local.is_dir() {
        return Ok(local);
    }
    // Auto-create tags dir if runs exist (tags live alongside runs)
    let runs_local = project.join("target/piano/runs");
    if runs_local.is_dir() {
        std::fs::create_dir_all(&local).map_err(io_context("create directory", &local))?;
        return Ok(local);
    }
    Err(Error::NoRuns)
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn is_binary_extension_exe() {
        let ext = std::ffi::OsStr::new("exe");
        // On the current platform, the result depends on cfg!(windows).
        // On Windows: .exe is a binary extension -> true.
        // On Unix: no extension counts as binary, .exe is not -> false.
        assert_eq!(is_binary_extension(ext), cfg!(windows));
    }

    #[test]
    fn is_binary_extension_rejects_non_binary() {
        for name in &["d", "fingerprint", "rmeta", "rlib", "o", "so", "dylib"] {
            let ext = std::ffi::OsStr::new(name);
            assert!(
                !is_binary_extension(ext),
                "extension .{name} should not be treated as binary"
            );
        }
    }

    #[test]
    fn parse_duration_zero() {
        let err = parse_duration_secs("0").unwrap_err();
        assert_eq!(err, "duration cannot be zero");
    }

    #[test]
    fn parse_duration_negative() {
        let err = parse_duration_secs("-1").unwrap_err();
        assert_eq!(err, "duration cannot be negative");
    }

    #[test]
    fn parse_duration_nan() {
        let err = parse_duration_secs("nan").unwrap_err();
        assert_eq!(err, "invalid duration");
    }

    #[test]
    fn parse_duration_inf() {
        let err = parse_duration_secs("inf").unwrap_err();
        assert_eq!(err, "invalid duration");
    }

    #[test]
    fn parse_duration_neg_inf() {
        let err = parse_duration_secs("-inf").unwrap_err();
        assert_eq!(err, "invalid duration");
    }

    #[test]
    fn parse_duration_too_large() {
        let err = parse_duration_secs("1e300").unwrap_err();
        assert_eq!(err, "duration is too large");
    }

    #[test]
    fn parse_duration_negative_zero() {
        let err = parse_duration_secs("-0.0").unwrap_err();
        assert_eq!(err, "duration cannot be zero");
    }

    #[test]
    fn parse_duration_valid_fractional() {
        let secs = parse_duration_secs("0.5").unwrap();
        assert_eq!(secs, 0.5);
    }

    #[test]
    fn parse_duration_invalid_string() {
        assert!(parse_duration_secs("abc").is_err());
    }

    /// main() is excluded from the name table -- it is the lifecycle boundary that
    /// creates the root context, not a profiled function.
    #[test]
    fn name_table_excludes_main() {
        let all_qualified = vec![
            piano::naming::QualifiedFunction::new("main", "main", "main"),
            piano::naming::QualifiedFunction::new("process", "process", "process"),
            piano::naming::QualifiedFunction::new("db::query", "db::query", "db::query"),
        ];
        let display_names = piano::naming::disambiguate(&all_qualified);

        let (name_ids, display_map, _next_id) = assign_name_ids(&all_qualified, &display_names);

        assert!(
            !name_ids.contains_key("main"),
            "main must not appear in the name table"
        );
        assert!(
            !display_map.contains_key("main"),
            "main must not appear in the display names"
        );
        assert!(
            name_ids.contains_key("process"),
            "non-main functions must be in the name table"
        );
        assert!(
            name_ids.contains_key("db::query"),
            "module-qualified functions must be in the name table"
        );
    }
}