miplog 0.2.0 - Docs.rs

//! Tests that parse *generated* solver logs from `tests/fixtures/logs/`.
//!
//! Run `python3 tests/generate_logs.py` first to produce logs from whatever
//! solvers are installed locally.  In CI, the GitHub Actions workflow installs
//! the free solvers and runs the generator before `cargo test`.
//!
//! Each log is from solving p0201 (MIPLIB), a 201-variable binary program
//! with known optimal objective = 7615.

use miplog::{autodetect, Solver, Status};
use std::path::Path;

const LOGS_DIR: &str = "tests/fixtures/logs";
const EXPECTED_OBJ: f64 = 7615.0;
const OBJ_TOL: f64 = 1.0; // integer problem, allow rounding

/// Try to load and parse a log.  Returns None if the file doesn't exist
/// (solver wasn't available when logs were generated).
fn try_parse(solver_name: &str) -> Option<miplog::SolverLog> {
    let path = Path::new(LOGS_DIR).join(format!("{solver_name}.log"));
    if !path.exists() {
        eprintln!("skip {solver_name}: {path:?} not found (run generate_logs.py)");
        return None;
    }
    let text = std::fs::read_to_string(&path).unwrap_or_else(|e| panic!("read {path:?}: {e}"));
    let log = autodetect(&text).unwrap_or_else(|e| panic!("autodetect {solver_name}: {e}"));
    Some(log)
}

/// Common assertions that must hold for every solver on p0201.
fn assert_p0201(log: &miplog::SolverLog, expected_solver: Solver) {
    let name = expected_solver.key();

    // Solver detection
    assert_eq!(log.solver, expected_solver, "{name}: wrong solver");

    // Version — not always present (e.g. PySCIPOpt logfile omits the banner)
    // assert version only when log includes it
    if log.version.is_some() {
        eprintln!("{name}: version = {:?}", log.version);
    }

    // Termination — p0201 is small, every solver should find optimal
    assert_eq!(
        log.termination.status,
        Status::Optimal,
        "{name}: expected Optimal, got {:?} ({:?})",
        log.termination.status,
        log.termination.raw_reason,
    );

    // Objective bounds — optimal = 7615
    let primal = log
        .bounds
        .primal
        .unwrap_or_else(|| panic!("{name}: no primal"));
    assert!(
        (primal - EXPECTED_OBJ).abs() < OBJ_TOL,
        "{name}: primal {primal} != {EXPECTED_OBJ}",
    );
    if let Some(dual) = log.bounds.dual {
        assert!(
            (dual - EXPECTED_OBJ).abs() < OBJ_TOL,
            "{name}: dual {dual} != {EXPECTED_OBJ}",
        );
    }

    // Gap should be ~0
    if let Some(gap) = log.bounds.gap {
        assert!(gap < 0.01, "{name}: gap {gap} too large for optimal",);
    }

    // Wall time should be populated and reasonable (< 60s for this instance)
    let wall = log
        .timing
        .wall_seconds
        .unwrap_or_else(|| panic!("{name}: no wall time"));
    assert!(wall > 0.0, "{name}: wall time should be > 0");
    assert!(wall < 60.0, "{name}: wall time {wall}s suspiciously large");

    // Presolve — at least some dimension should be captured
    let pre = &log.presolve;
    assert!(
        pre.rows_before.is_some() || pre.rows_after.is_some(),
        "{name}: no presolve dims at all",
    );

    // Problem name — not always available (e.g. Gurobi LogFile doesn't
    // include the "Read MPS" line that contains the filename).
    if log.problem.is_some() {
        eprintln!("{name}: problem = {:?}", log.problem);
    }
}

// --- Per-solver tests (each skips if log not available) ---

#[test]
fn generated_highs() {
    if let Some(log) = try_parse("highs") {
        assert_p0201(&log, Solver::Highs);
        assert!(log.tree.nodes_explored.is_some(), "highs: no nodes");
        assert!(!log.progress.is_empty(), "highs: no progress rows");
        eprintln!(
            "highs: {} progress rows, {} nodes",
            log.progress.len(),
            log.tree.nodes_explored.unwrap_or(0)
        );
    }
}

#[test]
fn generated_scip() {
    if let Some(log) = try_parse("scip") {
        assert_p0201(&log, Solver::Scip);
        // SCIP progress parsing not yet implemented — just check summary
        if !log.progress.is_empty() {
            eprintln!("scip: {} progress rows", log.progress.len());
        }
        if let Some(n) = log.tree.solutions_found {
            assert!(n > 1, "scip: expected multiple solutions, got {n}");
            eprintln!("scip: {n} solutions");
        }
    }
}

#[test]
fn generated_gurobi() {
    if let Some(log) = try_parse("gurobi") {
        assert_p0201(&log, Solver::Gurobi);
        assert!(!log.progress.is_empty(), "gurobi: no progress rows");
        // Cuts may not appear in LogFile (Gurobi writes them to stdout)
        if !log.cuts.is_empty() {
            eprintln!("gurobi: {} cuts families", log.cuts.len());
        }
        assert!(
            log.tree.solutions_found.unwrap_or(0) > 1,
            "gurobi: expected multiple solutions",
        );
        eprintln!(
            "gurobi: {} progress rows, {} cuts families, {} solutions",
            log.progress.len(),
            log.cuts.len(),
            log.tree.solutions_found.unwrap_or(0)
        );
    }
}

#[test]
fn generated_copt() {
    if let Some(log) = try_parse("copt") {
        assert_p0201(&log, Solver::Copt);
        assert!(log.tree.nodes_explored.is_some(), "copt: no nodes");
        assert!(!log.progress.is_empty(), "copt: no progress rows");
        eprintln!(
            "copt: {} progress rows, {} nodes",
            log.progress.len(),
            log.tree.nodes_explored.unwrap_or(0)
        );
    }
}

#[test]
fn generated_cbc() {
    if let Some(log) = try_parse("cbc") {
        assert_p0201(&log, Solver::Cbc);
        eprintln!("cbc: {} progress rows", log.progress.len());
    }
}

#[test]
fn generated_cplex() {
    if let Some(log) = try_parse("cplex") {
        assert_p0201(&log, Solver::Cplex);
        assert!(!log.progress.is_empty(), "cplex: no progress rows");
        eprintln!("cplex: {} progress rows", log.progress.len());
    }
}

#[test]
fn generated_xpress() {
    if let Some(log) = try_parse("xpress") {
        assert_p0201(&log, Solver::Xpress);
        // Xpress progress table format varies by version
        if !log.progress.is_empty() {
            eprintln!("xpress: {} progress rows", log.progress.len());
        }
    }
}

#[test]
fn generated_mosek() {
    if let Some(log) = try_parse("mosek") {
        assert_p0201(&log, Solver::Mosek);
        eprintln!("mosek: wall={:.2}s", log.timing.wall_seconds.unwrap_or(0.0));
    }
}

/// Time-limit fixtures: every `*-timelimit.log` must parse with
/// `Status::TimeLimit`, a non-zero gap, and both bounds populated.
/// These exercise the parser code paths that don't fire on the
/// optimal-completion `*.log` fixtures.
#[test]
fn timelimit_fixtures_parse_as_time_limit() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut total = 0;
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        let n = path.file_name().unwrap().to_string_lossy().into_owned();
        if !n.ends_with("-timelimit.log") {
            continue;
        }
        total += 1;
        let text = std::fs::read_to_string(&path).unwrap();
        let log = autodetect(&text).unwrap_or_else(|e| panic!("autodetect {n}: {e}"));
        assert_eq!(
            log.termination.status,
            Status::TimeLimit,
            "{n}: expected TimeLimit, got {:?} ({:?})",
            log.termination.status,
            log.termination.raw_reason,
        );
        assert!(
            log.bounds.primal.is_some(),
            "{n}: time-limit run should have a primal incumbent",
        );
        assert!(
            log.bounds.dual.is_some(),
            "{n}: time-limit run should have a dual bound",
        );
        let gap = log.bounds.effective_gap().unwrap();
        assert!(
            gap > 0.001,
            "{n}: time-limit run should have a non-trivial gap, got {gap}",
        );
        let wall = log.timing.wall_seconds.unwrap_or(0.0);
        assert!(
            wall > 0.5,
            "{n}: wall_seconds {wall} suspiciously small for a time-limited run",
        );
    }
    assert!(
        total >= 4,
        "expected ≥4 -timelimit.log fixtures, found {total}"
    );
    eprintln!("verified {total} time-limit fixtures");
}

/// Node-limit fixtures: every `*-nodelimit.log` must parse with
/// `Status::OtherLimit`, both bounds populated, gap > 0, and `nodes_explored`
/// not wildly larger than the configured cap. Validates the
/// "stopped-by-non-time-limit" code path on each parser.
#[test]
fn nodelimit_fixtures_parse_as_other_limit() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut total = 0;
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        let n = path.file_name().unwrap().to_string_lossy().into_owned();
        if !n.ends_with("-nodelimit.log") {
            continue;
        }
        total += 1;
        let text = std::fs::read_to_string(&path).unwrap();
        let log = autodetect(&text).unwrap_or_else(|e| panic!("autodetect {n}: {e}"));
        assert_eq!(
            log.termination.status,
            Status::OtherLimit,
            "{n}: expected OtherLimit, got {:?} ({:?})",
            log.termination.status,
            log.termination.raw_reason,
        );
        assert!(log.bounds.primal.is_some(), "{n}: should have a primal");
        assert!(log.bounds.dual.is_some(), "{n}: should have a dual");
        let gap = log.bounds.effective_gap().unwrap_or(0.0);
        assert!(gap > 0.001, "{n}: should have a non-trivial gap, got {gap}");
    }
    assert!(
        total >= 4,
        "expected ≥4 -nodelimit.log fixtures, found {total}"
    );
    eprintln!("verified {total} node-limit fixtures");
}

/// `*-infeasible.log`: every fixture must classify as `Status::Infeasible`.
/// No assertion on bounds — solvers vary on whether they emit a primal/dual
/// for infeasible runs (some print +/- their inf sentinel).
#[test]
fn infeasible_fixtures_parse_as_infeasible() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut total = 0;
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        let n = path.file_name().unwrap().to_string_lossy().into_owned();
        if !n.ends_with("-infeasible.log") {
            continue;
        }
        total += 1;
        let text = std::fs::read_to_string(&path).unwrap();
        let log = autodetect(&text).unwrap_or_else(|e| panic!("autodetect {n}: {e}"));
        assert_eq!(
            log.termination.status,
            Status::Infeasible,
            "{n}: expected Infeasible, got {:?} ({:?})",
            log.termination.status,
            log.termination.raw_reason,
        );
    }
    assert!(
        total >= 4,
        "expected ≥4 -infeasible.log fixtures, found {total}"
    );
    eprintln!("verified {total} infeasible fixtures");
}

/// `*-concat.log`: Mittelmann-style bundles with three instance runs each
/// (p0201 optimal, glass4 time-limited, glass4 node-limited). Verifies
/// `input::split_concatenated` produces the expected entries and that each
/// chunk parses to its expected status.
#[test]
fn concat_fixtures_split_and_parse() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut total = 0;
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        let n = path.file_name().unwrap().to_string_lossy().into_owned();
        if !n.ends_with("-concat.log") {
            continue;
        }
        total += 1;
        let text = std::fs::read_to_string(&path).unwrap();
        let entries = miplog::input::split_concatenated(&text);
        assert_eq!(
            entries.len(),
            3,
            "{n}: expected 3 concat entries, got {}",
            entries.len(),
        );

        // Entry order matches build_concat_fixtures(): p0201, glass4-tl, glass4-nl.
        let want = [
            ("p0201.mps.gz", Status::Optimal),
            ("glass4.mps.gz", Status::TimeLimit),
            ("glass4.mps.gz", Status::OtherLimit),
        ];
        for (i, (expected_inst, expected_status)) in want.iter().enumerate() {
            let entry = &entries[i];
            assert!(
                entry.instance.ends_with(expected_inst),
                "{n}[{i}]: instance {:?} doesn't end with {expected_inst}",
                entry.instance,
            );
            let log =
                autodetect(&entry.text).unwrap_or_else(|e| panic!("{n}[{i}]: parse failed: {e}"));
            assert_eq!(
                log.termination.status, *expected_status,
                "{n}[{i}] ({}): expected {expected_status:?}, got {:?}",
                entry.instance, log.termination.status,
            );
        }
    }
    assert!(
        total >= 4,
        "expected ≥4 -concat.log fixtures, found {total}"
    );
    eprintln!("verified {total} concatenated fixtures");
}

/// `*-lp.log`: pure-LP runs (no integer variables). Should classify as
/// `Status::Optimal` and have a primal objective. No B&B → progress table
/// can be empty, no cuts expected.
#[test]
fn lp_fixtures_parse_as_optimal_lp() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut total = 0;
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        let n = path.file_name().unwrap().to_string_lossy().into_owned();
        if !n.ends_with("-lp.log") {
            continue;
        }
        total += 1;
        let text = std::fs::read_to_string(&path).unwrap();
        let log = autodetect(&text).unwrap_or_else(|e| panic!("autodetect {n}: {e}"));
        assert_eq!(
            log.termination.status,
            Status::Optimal,
            "{n}: expected Optimal, got {:?} ({:?})",
            log.termination.status,
            log.termination.raw_reason,
        );
        let p = log
            .bounds
            .primal
            .unwrap_or_else(|| panic!("{n}: no primal"));
        // The tiny LP has known optimal -5 (within solver tolerance).
        assert!((p - (-5.0)).abs() < 0.01, "{n}: primal {p} ≠ -5",);
    }
    assert!(total >= 4, "expected ≥4 -lp.log fixtures, found {total}");
    eprintln!("verified {total} LP fixtures");
}

/// Every generated log must satisfy the documented Core (`verify_common`)
/// tier. A failure here means a parser isn't populating fields that the
/// schema promises as reliably cross-solver — file as a parser bug.
#[test]
fn generated_all_pass_verify_common() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let mut failures: Vec<String> = Vec::new();
    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        if path.extension().map(|x| x == "log").unwrap_or(false) {
            let text = std::fs::read_to_string(&path).unwrap();
            let Ok(log) = autodetect(&text) else { continue };
            if let Err(missing) = log.verify_common() {
                let name = path.file_name().unwrap().to_string_lossy();
                failures.push(format!("{name}: missing {missing:?}"));
            }
        }
    }
    assert!(
        failures.is_empty(),
        "Core-tier gaps:\n  {}",
        failures.join("\n  "),
    );
}

/// Meta-test: at least one solver log should exist.
/// Prevents silent "all skipped" in a misconfigured CI.
#[test]
fn at_least_one_solver_log_exists() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        eprintln!("WARN: {LOGS_DIR} missing — run `python3 tests/generate_logs.py`");
        return;
    }
    let count = std::fs::read_dir(dir)
        .unwrap()
        .filter_map(|e| e.ok())
        .filter(|e| e.path().extension().map(|x| x == "log").unwrap_or(false))
        .count();
    assert!(
        count > 0,
        "No .log files in {LOGS_DIR} — run `python3 tests/generate_logs.py`",
    );
    eprintln!("Found {count} solver log(s) in {LOGS_DIR}");
}

/// Round-trip: parse → write JSON.gz → read back → compare.
#[test]
fn generated_roundtrip() {
    let dir = Path::new(LOGS_DIR);
    if !dir.exists() {
        return;
    }
    let tmp = std::env::temp_dir().join("miplog-generated-rt");
    std::fs::create_dir_all(&tmp).unwrap();

    for entry in std::fs::read_dir(dir).unwrap().flatten() {
        let path = entry.path();
        if path.extension().map(|x| x == "log").unwrap_or(false) {
            let text = std::fs::read_to_string(&path).unwrap();
            let log = match autodetect(&text) {
                Ok(l) => l,
                Err(_) => continue,
            };
            let stem = path.file_stem().unwrap().to_string_lossy();
            let gz = tmp.join(format!("{stem}.json.gz"));
            miplog::output::write_json_gz(&gz, &log).unwrap();
            let back = miplog::output::read_json(&gz).unwrap();
            assert_eq!(back.solver, log.solver, "{stem}: solver mismatch");
            assert_eq!(
                back.termination.status, log.termination.status,
                "{stem}: status mismatch",
            );
            assert_eq!(
                back.progress.len(),
                log.progress.len(),
                "{stem}: progress len mismatch",
            );
            eprintln!(
                "  roundtrip {stem}: ok ({} bytes)",
                gz.metadata().unwrap().len()
            );
        }
    }
}