gam 0.3.125 - Docs.rs

//! Skovgaard's modified directed likelihood root `r*` for a **scalar** interest
//! parameter (issue #939, deliverable 3).
//!
//! For a scalar functional `ψ = cᵀβ` tested against `ψ₀` (e.g. "is the smooth
//! zero at `x₀`", a point-on-curve or a contrast), the first-order signed root
//! of the (profile) likelihood-ratio statistic
//!
//! ```text
//! r = sign(ψ̂ − ψ₀) · √( 2 [ ℓ(ψ̂) − ℓ(ψ₀) ] )
//! ```
//!
//! is `N(0,1)` only to `O(n⁻¹ᐟ²)`. **Barndorff-Nielsen's modified root**
//!
//! ```text
//! r* = r + (1/r) · log( u / r )
//! ```
//!
//! is `N(0,1)` to `O(n⁻³ᐟ²)` — third-order accurate. The hard ingredient is the
//! Skovgaard (1996) sample-space-derivative approximation to `u`. For a scalar
//! interest parameter this assembles entirely from quantities the engine already
//! maintains: the **observed** information `ĵ` (the penalized Hessian / true
//! second derivative at the optimum), the **expected** information `î` (the
//! Fisher weights every family computes for PIRLS), and the score covariance
//! (the per-row score outer product). No new theory and no sample-space
//! quadrature are needed — it is assembly, per the issue's Stage-1 plan.
//!
//! # The scalar Skovgaard `u`
//!
//! For a scalar parameter with no nuisance, Barndorff-Nielsen's exact `u` is the
//! **sample-space derivative** of the log-likelihood, normalised by the observed
//! information at the MLE:
//!
//! ```text
//! u = ĵ^{-1/2} · { ℓ_{;θ̂}(θ̂) − ℓ_{;θ̂}(θ₀) },     ĵ = −ℓ''(θ̂).
//! ```
//!
//! The sample-space derivative `ℓ_{;θ̂}` is generally intractable (it needs an
//! ancillary). **Skovgaard's (1996) approximation** replaces that derivative
//! difference with a covariance of likelihood quantities computed under the
//! fitted model (Skovgaard 1996, *Bernoulli* 2:145–165; Severini, *Likelihood
//! Methods in Statistics*, 2000, §7.5):
//!
//! ```text
//! ℓ_{;θ̂}(θ̂) − ℓ_{;θ̂}(θ₀)  ≈  q̃ := cov_θ̂[ U(θ̂), ℓ(θ̂) − ℓ(θ₀) ],
//! ```
//!
//! which is **exact** for a full exponential family and `O(n⁻¹)`-accurate in
//! general. Expanding `q̃` about the MLE, its leading term is
//! `q̃ ≈ (θ̂ − θ₀) · var_θ̂[U(θ̂)]`, and `var[U]` is precisely the information
//! the model supplies. Writing the score `U(θ) = ℓ'(θ) = Σᵢ s_i(θ)`,
//!
//! * `ĵ = −ℓ''(θ̂)` — the **observed** information at the MLE (the penalized
//!   Hessian; the Barndorff-Nielsen normaliser `ĵ^{-1/2}`),
//! * `î = E[−ℓ''] = var[U]` — the **expected** (Fisher) information (the Fisher
//!   weights every family computes for PIRLS; the score variance that enters
//!   `q̃`),
//! * `Î` — the empirical **score (outer-product) covariance** information, the
//!   data-based (robust / sandwich) estimate of the same `var[U]`; for a single
//!   scalar score it is `Σᵢ s_i(θ̂)²`, and for a functional `ψ = cᵀβ` it is the
//!   sandwich reduction `(cᵀ Ĥ⁻¹ (Σᵢ sᵢsᵢᵀ) Ĥ⁻¹ c)⁻¹`.
//!
//! The scalar Skovgaard statistic is therefore
//!
//! ```text
//! u = (θ̂ − θ₀) · î / √ĵ           (model / Fisher form, the primary r*),
//! ```
//!
//! the observed-information Wald root `(θ̂ − θ₀)√ĵ` rescaled by the
//! **expected/observed information ratio `î/ĵ`** — the curvature correction that
//! the first-order root ignores. For a **canonical** link `î = ĵ` and the factor
//! is `1`; for a **non-canonical** link `î ≠ ĵ` and the correction is genuinely
//! applied (this is the whole point — it is silently lost if `î` is dropped).
//! Replacing the model variance `î` by its empirical estimate `Î` gives the
//! **Severini empirical** companion `u_emp = (θ̂ − θ₀) · Î / √ĵ`; the two agree
//! to `O(n⁻¹)` under correct specification and diverge under misspecification, so
//! reporting both is a model-adequacy diagnostic. In the regular case
//! `î = ĵ = Î`, both collapse to `u = (θ̂ − θ₀)√ĵ → r`, so `r* → r`.
//!
//! # Certification anchor
//!
//! The unit-rate / general-rate **Exponential** model has every ingredient in
//! closed form, so `r*` is checkable against a direct evaluation: `y_i ~ Exp(θ)`,
//! `ℓ(θ) = n log θ − θ Σy`, `θ̂ = n / Σy`, `ĵ = n/θ̂²`, `î = n/θ²`, and the
//! score covariance `Î = n/θ²` at the true `θ`. Because the family is canonical
//! `î = ĵ = Î` and `u` reduces to `(θ̂ − θ₀)√ĵ`; the fixture verifies `r*`
//! moves the directed root toward its `N(0,1)` calibration and reduces to `r`
//! in the large-`n` limit. The **non-canonical** companion fixture
//! (`non_canonical_link_expected_info_enters_u`) pins `î ≠ ĵ` and asserts the
//! `î/ĵ` factor changes `u` — the regression guard for this module.

/// The ingredients of the scalar Skovgaard `r*`, all evaluated for a single
/// scalar interest parameter `θ` (the functional `ψ = cᵀβ` after profiling out
/// the nuisance coefficients).
///
/// Every field is a quantity the fitted model already exposes; this struct is a
/// pure data carrier so the assembly is testable in isolation against the
/// closed-form fixtures.
#[derive(Debug, Clone, Copy)]
pub struct ScalarSkovgaardInput {
    /// The interest parameter estimate `θ̂` (e.g. `ψ̂ = cᵀβ̂`).
    pub theta_hat: f64,
    /// The tested null value `θ₀` (e.g. `ψ₀`, often `0` for "smooth is zero").
    pub theta_null: f64,
    /// The profile log-likelihood-ratio statistic
    /// `W = 2[ℓ(θ̂) − ℓ(θ₀)] ≥ 0` (from a constrained refit at `cᵀβ = θ₀`).
    pub lr_statistic: f64,
    /// Observed information `ĵ` for the interest parameter at the optimum: the
    /// scalar reduction `(cᵀ Ĥ⁻¹ c)⁻¹` of the penalized Hessian `Ĥ`, i.e. the
    /// inverse of the profile variance of `θ̂`.
    pub observed_info: f64,
    /// Expected (Fisher) information `î` for the interest parameter — the same
    /// reduction using the Fisher-weight information `Iₑ` the family supplies to
    /// PIRLS: `(cᵀ Iₑ⁻¹ c)⁻¹`.
    pub expected_info: f64,
    /// Score (outer-product) covariance `Î` for the interest parameter: the
    /// reduction `(cᵀ Ĥ⁻¹ (Σᵢ sᵢsᵢᵀ) Ĥ⁻¹ c)` evaluated with the per-row score
    /// contributions `sᵢ = ∂ℓᵢ/∂β`, inverted to the parameter scale. The
    /// "robust"/empirical information.
    pub score_cov: f64,
}

/// The Skovgaard `r*` report for a scalar test.
#[derive(Debug, Clone, Copy)]
pub struct ScalarSkovgaardResult {
    /// The first-order directed likelihood root `r = sign(θ̂−θ₀)·√W`.
    pub r: f64,
    /// Skovgaard's `u` quantity, model/Fisher form `u = (θ̂−θ₀)·î/√ĵ`.
    pub u: f64,
    /// The modified directed root `r* = r + log(u/r)/r` (model/Fisher form).
    pub r_star: f64,
    /// First-order two-sided p-value `2·Φ(−|r|)`.
    pub p_value_first_order: f64,
    /// Third-order two-sided p-value `2·Φ(−|r*|)` (model/Fisher form).
    pub p_value_corrected: f64,
    /// The Severini empirical companion `u_emp = (θ̂−θ₀)·Î/√ĵ`, using the
    /// empirical score covariance `Î` in place of the model Fisher information
    /// `î`. Equals [`Self::u`] when `î = Î`.
    pub u_empirical: f64,
    /// The empirical modified root `r* = r + log(u_emp/r)/r`. Falls back to `r`
    /// when the empirical log-domain guard fails, exactly as the model form.
    pub r_star_empirical: f64,
    /// Two-sided p-value `2·Φ(−|r*_emp|)` of the empirical companion.
    pub p_value_corrected_empirical: f64,
    /// Whether the `r*` correction is **material** (>10% relative change in the
    /// p-value, or `|r* − r| > 0.1·|r|`): the per-test diagnostic that the
    /// sample is too small for first-order inference here (#939 deliverable 4).
    pub material: bool,
}

/// Standard normal CDF `Φ`.
fn normal_cdf(z: f64) -> f64 {
    0.5 * statrs::function::erf::erfc(-z / std::f64::consts::SQRT_2)
}

/// Two-sided normal-tail p-value `2·Φ(−|z|)`.
fn two_sided_p(z: f64) -> f64 {
    (2.0 * normal_cdf(-z.abs())).clamp(0.0, 1.0)
}

/// The materiality threshold (#939 deliverable 4): a correction is material when
/// it moves the result by more than 10%.
pub const SKOVGAARD_MATERIAL_THRESHOLD: f64 = 0.10;

/// Assemble the scalar Skovgaard `r*` from its ingredients.
///
/// Returns `None` when the inputs are degenerate: a non-positive LR statistic
/// (the directed root is undefined at `r = 0`), a non-finite or non-positive
/// information, or a non-finite `r*` (e.g. `u/r ≤ 0`, where the third-order
/// formula does not apply and the first-order root stands). The caller then
/// reports the first-order `r` only — the correction is never forced.
pub fn scalar_skovgaard_r_star(input: &ScalarSkovgaardInput) -> Option<ScalarSkovgaardResult> {
    let ScalarSkovgaardInput {
        theta_hat,
        theta_null,
        lr_statistic,
        observed_info,
        expected_info,
        score_cov,
    } = *input;

    if !(lr_statistic.is_finite() && lr_statistic > 0.0) {
        return None;
    }
    if !(observed_info.is_finite() && observed_info > 0.0) {
        return None;
    }
    if !(expected_info.is_finite() && expected_info > 0.0) {
        return None;
    }
    if !(score_cov.is_finite() && score_cov > 0.0) {
        return None;
    }
    if !(theta_hat.is_finite() && theta_null.is_finite()) {
        return None;
    }

    // θ̂ = θ₀ ⇒ the directed root is exactly `r = 0`: no side, no correction.
    // NOTE: `f64::signum` returns `±1.0` even for `±0.0` (it never returns `0.0`),
    // so the equality case MUST be detected directly from `θ̂ − θ₀ == 0` rather
    // than from `sign == 0.0` — the latter is unreachable and would let an
    // on-the-null input fall through to `r = √W ≠ 0`.
    if theta_hat == theta_null {
        return Some(ScalarSkovgaardResult {
            r: 0.0,
            u: 0.0,
            r_star: 0.0,
            p_value_first_order: 1.0,
            p_value_corrected: 1.0,
            u_empirical: 0.0,
            r_star_empirical: 0.0,
            p_value_corrected_empirical: 1.0,
            material: false,
        });
    }
    // First-order directed root: sign from the estimate's side of the null, mag
    // from the LR statistic. `θ̂ ≠ θ₀` here, so `sign ∈ {−1, +1}`.
    let sign = (theta_hat - theta_null).signum();
    let p_first = two_sided_p(sign * lr_statistic.sqrt());
    let r = sign * lr_statistic.sqrt();

    // Barndorff-Nielsen's `u = ĵ^{-1/2}·{SSD}` with Skovgaard's covariance
    // approximation to the sample-space-derivative difference (see the module
    // header): `SSD ≈ q̃ ≈ (θ̂−θ₀)·var[U]`, so the score-variance information
    // `var[U]` enters the numerator and the observed information `ĵ` is the
    // Barndorff-Nielsen normaliser `ĵ^{-1/2}`:
    //
    //   u     = (θ̂ − θ₀) · î / √ĵ      (model / Fisher var[U] = î)
    //   u_emp = (θ̂ − θ₀) · Î / √ĵ      (Severini empirical var[U] = Î).
    //
    // The expected/observed ratio `î/ĵ` is the curvature correction that the
    // first-order root drops; it is `1` for a canonical link and `≠ 1` for a
    // non-canonical one. In the regular case `î = ĵ = Î` both collapse to
    // `(θ̂ − θ₀)√ĵ → r`.
    let dtheta = theta_hat - theta_null;
    let sqrt_obs = observed_info.sqrt();
    let u = dtheta * expected_info / sqrt_obs;
    let u_empirical = dtheta * score_cov / sqrt_obs;

    // Barndorff-Nielsen modification `r* = r + log(u/r)/r`, guarding the
    // log-domain (`u` and `r` must share a sign and `u/r > 0`): when the
    // third-order formula does not apply the first-order root stands.
    let modified_root = |u_val: f64| -> f64 {
        let ratio = u_val / r;
        if !(ratio.is_finite() && ratio > 0.0) {
            return r;
        }
        let rs = r + ratio.ln() / r;
        if rs.is_finite() { rs } else { r }
    };
    let r_star = modified_root(u);
    let r_star_empirical = modified_root(u_empirical);

    let p_corr = two_sided_p(r_star);
    let p_corr_empirical = two_sided_p(r_star_empirical);
    let p_denom = p_first.max(p_corr).max(f64::MIN_POSITIVE);
    let p_move = (p_corr - p_first).abs() / p_denom;
    let r_move = (r_star - r).abs() / r.abs().max(f64::MIN_POSITIVE);
    let material = p_move > SKOVGAARD_MATERIAL_THRESHOLD || r_move > SKOVGAARD_MATERIAL_THRESHOLD;

    Some(ScalarSkovgaardResult {
        r,
        u,
        r_star,
        p_value_first_order: p_first,
        p_value_corrected: p_corr,
        u_empirical,
        r_star_empirical,
        p_value_corrected_empirical: p_corr_empirical,
        material,
    })
}

/// Assemble [`ScalarSkovgaardInput`] for a scalar functional `ψ = cᵀβ` from the
/// matrix-level ingredients a fitted penalized GLM exposes, then compute `r*`.
///
/// * `contrast` (`c`) — the functional gradient `∂ψ/∂β`: a design row for a
///   point-on-curve `m(x₀)`, the difference of two rows for a contrast, or any
///   linear functional gradient.
/// * `beta` — fitted coefficients `β̂`.
/// * `penalized_hessian` (`Ĥ = X'WX + S_λ`) — the **observed** information in
///   coefficient space (the engine's penalized Hessian / true second
///   derivative).
/// * `fisher_information` (`Iₑ = X'WX`) — the **expected** (Fisher) information
///   in coefficient space (the PIRLS Fisher weights; pass `None` to reuse the
///   penalized Hessian when the family is canonical and the distinction
///   vanishes).
/// * `row_scores` (`sᵢ = ∂ℓᵢ/∂β`, `n × p`) — per-row score contributions for the
///   score (outer-product) covariance `Σᵢ sᵢsᵢᵀ`.
/// * `lr_statistic` (`W = 2[ℓ(β̂) − ℓ(β̂₀)]`) — the profile likelihood-ratio
///   statistic from a constrained refit at `cᵀβ = θ₀` (caller-supplied; the
///   constrained-fit machinery lives in the KKT path).
/// * `theta_null` (`θ₀`) — the tested value (commonly `0`).
///
/// The scalar reductions are the standard profile/marginal identities:
/// `observed_info = (cᵀ Ĥ⁻¹ c)⁻¹`, `expected_info = (cᵀ Iₑ⁻¹ c)⁻¹`, and
/// `score_cov = (cᵀ Ĥ⁻¹ (Σ sᵢsᵢᵀ) Ĥ⁻¹ c)⁻¹` — the inverse of the sandwich
/// (robust) variance of `ψ̂`. Returns `None` on any degenerate reduction.
pub fn scalar_skovgaard_from_matrices(
    contrast: ndarray::ArrayView1<'_, f64>,
    beta: ndarray::ArrayView1<'_, f64>,
    penalized_hessian: ndarray::ArrayView2<'_, f64>,
    fisher_information: Option<ndarray::ArrayView2<'_, f64>>,
    row_scores: ndarray::ArrayView2<'_, f64>,
    lr_statistic: f64,
    theta_null: f64,
) -> Option<ScalarSkovgaardResult> {
    use crate::faer_ndarray::FaerCholesky;
    use faer::Side;

    let p = beta.len();
    if p == 0
        || contrast.len() != p
        || penalized_hessian.nrows() != p
        || penalized_hessian.ncols() != p
        || row_scores.ncols() != p
    {
        return None;
    }
    if contrast.iter().any(|v| !v.is_finite()) || beta.iter().any(|v| !v.is_finite()) {
        return None;
    }

    let theta_hat = contrast.dot(&beta);

    // Ĥ⁻¹ c via the penalized-Hessian Cholesky.
    let h_obs = penalized_hessian.to_owned();
    let chol_obs = h_obs.cholesky(Side::Lower).ok()?;
    let c_owned = contrast.to_owned();
    let hinv_c = chol_obs.solvevec(&c_owned);
    if hinv_c.iter().any(|v| !v.is_finite()) {
        return None;
    }
    // Profile variance of ψ̂ under the penalized fit: cᵀ Ĥ⁻¹ c. Observed info is
    // its inverse.
    let var_obs = contrast.dot(&hinv_c);
    if !(var_obs.is_finite() && var_obs > 0.0) {
        return None;
    }
    let observed_info = 1.0 / var_obs;

    // Expected info: same reduction with the Fisher information; default to the
    // penalized Hessian when the family/link is canonical (no distinction).
    let expected_info = match fisher_information {
        Some(fisher) => {
            if fisher.nrows() != p || fisher.ncols() != p {
                return None;
            }
            let f_owned = fisher.to_owned();
            let chol_f = f_owned.cholesky(Side::Lower).ok()?;
            let finv_c = chol_f.solvevec(&c_owned);
            let var_exp = contrast.dot(&finv_c);
            if !(var_exp.is_finite() && var_exp > 0.0) {
                return None;
            }
            1.0 / var_exp
        }
        None => observed_info,
    };

    // Score (outer-product) covariance in parameter space: the sandwich variance
    // cᵀ Ĥ⁻¹ (Σ sᵢsᵢᵀ) Ĥ⁻¹ c, inverted. With a = Ĥ⁻¹ c this is Σᵢ (sᵢᵀ a)².
    let mut sandwich = 0.0;
    for srow in row_scores.rows() {
        if srow.iter().any(|v| !v.is_finite()) {
            return None;
        }
        let proj = srow.dot(&hinv_c);
        sandwich += proj * proj;
    }
    if !(sandwich.is_finite() && sandwich > 0.0) {
        return None;
    }
    let score_cov = 1.0 / sandwich;

    scalar_skovgaard_r_star(&ScalarSkovgaardInput {
        theta_hat,
        theta_null,
        lr_statistic,
        observed_info,
        expected_info,
        score_cov,
    })
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn regular_case_collapses_to_first_order() {
        // î = ĵ = Î (regular, large-n limit): u = (θ̂−θ₀)·î/√ĵ = (θ̂−θ₀)√ĵ ≈ r,
        // so r* = r. Take a model with info = 100, θ̂−θ₀ = 0.3 ⇒ Wald² = 9, and
        // the LR statistic equals the Wald square to leading order.
        let info = 100.0;
        let dtheta = 0.3;
        let lr = dtheta * dtheta * info; // 9.0
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.3,
            theta_null: 0.0,
            lr_statistic: lr,
            observed_info: info,
            expected_info: info,
            score_cov: info,
        })
        .expect("r*");
        // r = +3, u = (0.3)·100/10 = 3, ratio = 1, log(1)/3 = 0 ⇒ r* = r.
        assert!((res.r - 3.0).abs() < 1e-12, "r = {}", res.r);
        assert!((res.u - 3.0).abs() < 1e-12, "u = {}", res.u);
        assert!((res.r_star - res.r).abs() < 1e-12, "r* = {}", res.r_star);
        // The empirical companion uses the same î = ĵ = Î ⇒ identical to u.
        assert!(
            (res.u_empirical - res.u).abs() < 1e-12,
            "u_emp = {}",
            res.u_empirical
        );
        assert!((res.r_star_empirical - res.r_star).abs() < 1e-12);
        assert!(!res.material, "regular case must not be material");
    }

    #[test]
    fn expected_observed_ratio_shifts_r_star_and_p() {
        // The whole point of the fix: the expected/observed information ratio
        // î/ĵ drives u. With î > ĵ (expected information larger than observed —
        // a non-canonical-link signature), u > r and r* > r (a larger root,
        // smaller p-value). The empirical companion uses Î independently.
        let dtheta = 0.2;
        let observed = 100.0; // ĵ
        let expected = 196.0; // î > ĵ ⇒ î/ĵ = 1.96 correction
        let score_cov = 121.0; // Î (drives the empirical companion only)
        let lr = dtheta * dtheta * observed; // 4.0, r = 2.0
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.2,
            theta_null: 0.0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        })
        .expect("r*");
        assert!((res.r - 2.0).abs() < 1e-12);
        // u = 0.2·196/√100 = 3.92, ratio = 1.96, r* = 2 + ln(1.96)/2.
        let expected_u = dtheta * expected / observed.sqrt();
        assert!((res.u - expected_u).abs() < 1e-12, "u = {}", res.u);
        assert!(
            (res.r_star - 2.336_472_236_6).abs() < 1e-9,
            "r* = {}",
            res.r_star
        );
        assert!(res.r_star > res.r, "î > ĵ must lift r*");
        assert!(
            res.p_value_corrected < res.p_value_first_order,
            "larger root ⇒ smaller two-sided p"
        );
        assert!(
            res.material,
            "96% information discrepancy must flag material"
        );
        // Empirical companion: u_emp = 0.2·121/10 = 2.42, independent of î.
        assert!((res.u_empirical - dtheta * score_cov / observed.sqrt()).abs() < 1e-12);
        assert!((res.r_star_empirical - 2.095_310_179_8).abs() < 1e-9);
    }

    /// CONJUGATE FIXTURE (Exponential rate, scalar): every Skovgaard ingredient
    /// is closed form. `yᵢ ~ Exp(θ)`, `ℓ(θ) = n log θ − θ Σy`,
    /// `θ̂ = n/Σy`. At the data-generating `θ = 1` with `n` rows and the MLE
    /// `θ̂`, the observed and expected informations are `n/θ̂²` and `n/θ²`, and
    /// the score covariance at `θ̂` is `n/θ̂²` (the score variance equals the
    /// observed information for this canonical family). The directed root, `u`,
    /// and `r*` are then exactly computable; the test asserts the formula
    /// reproduces them and that `r*` is closer to its normal calibration than
    /// the skewed first-order `r`.
    #[test]
    fn exponential_rate_scalar_skovgaard_closed_form() {
        // Fix a concrete sufficient statistic: n = 25 rows, Σy = 20 ⇒ θ̂ = 1.25,
        // test θ₀ = 1.0.
        let n = 25.0_f64;
        let sum_y = 20.0_f64;
        let theta_hat = n / sum_y; // 1.25
        let theta0 = 1.0_f64;
        // ℓ(θ) = n ln θ − θ Σy.
        let ll = |t: f64| n * t.ln() - t * sum_y;
        let lr = (2.0 * (ll(theta_hat) - ll(theta0))).max(0.0);
        // Observed info at θ̂: −ℓ''(θ) = n/θ². ĵ = n/θ̂².
        let observed = n / (theta_hat * theta_hat);
        // Expected info at θ̂ (Fisher) = n/θ̂² for this family at the MLE.
        let expected = n / (theta_hat * theta_hat);
        // Score covariance at θ̂: var(ℓ') = n/θ̂² (the canonical identity).
        let score_cov = n / (theta_hat * theta_hat);
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        })
        .expect("r*");
        // Closed-form directed root.
        let r_expected = (theta_hat - theta0).signum() * lr.sqrt();
        assert!((res.r - r_expected).abs() < 1e-12, "r = {}", res.r);
        // u = (θ̂−θ₀)·î/√ĵ; here î = ĵ so u = (θ̂−θ₀)·√ĵ.
        let u_expected = (theta_hat - theta0) * expected / observed.sqrt();
        assert!((res.u - u_expected).abs() < 1e-12, "u = {}", res.u);
        // Canonical family ⇒ the empirical companion coincides with the model u.
        assert!(
            (res.u_empirical - res.u).abs() < 1e-12,
            "u_emp = {}",
            res.u_empirical
        );
        // r* finite and on the same side as r.
        assert!(res.r_star.is_finite());
        assert!(res.r_star.signum() == res.r.signum());
        // Canonical identity: u = q = (θ̂−θ₀)√ĵ, the Wald root (î = ĵ here). For
        // the right-skewed exponential LR the directed root r overstates the
        // Wald root, and the higher-order r* lies strictly between the Wald root
        // and r — the refinement that pulls the skewed first-order root back.
        let q = (theta_hat - theta0) * observed.sqrt();
        assert!(
            (res.u - q).abs() < 1e-12,
            "u = {} should equal Wald root q = {q}",
            res.u
        );
        assert!(
            q < res.r_star && res.r_star < r_expected,
            "need q < r* < r: q={q} r*={} r={r_expected}",
            res.r_star
        );
        // Both p-values are valid probabilities, the corrected one finite.
        assert!((0.0..=1.0).contains(&res.p_value_first_order));
        assert!((0.0..=1.0).contains(&res.p_value_corrected));
    }

    #[test]
    fn matrix_assembler_reduces_diagonal_case() {
        use ndarray::{Array2, array};
        // p = 1 (a scalar coefficient β with contrast c = [1]). Penalized
        // Hessian = [[50]], Fisher = [[40]], two score rows summing to a known
        // outer product. β̂ = [0.25], θ₀ = 0.
        let contrast = array![1.0_f64];
        let beta = array![0.25_f64];
        let h = Array2::from_shape_vec((1, 1), vec![50.0]).unwrap();
        let fisher = Array2::from_shape_vec((1, 1), vec![40.0]).unwrap();
        // Two rows with scores 3.0 and 4.0 ⇒ Σ sᵢ² = 25; a = Ĥ⁻¹c = 1/50.
        // sandwich = Σ (sᵢ·a)² = 25/2500 = 0.01 ⇒ score_cov = 100.
        let row_scores = Array2::from_shape_vec((2, 1), vec![3.0, 4.0]).unwrap();
        let lr = 4.0;
        let res = scalar_skovgaard_from_matrices(
            contrast.view(),
            beta.view(),
            h.view(),
            Some(fisher.view()),
            row_scores.view(),
            lr,
            0.0,
        )
        .expect("assembled r*");
        // observed_info ĵ = 1/(cᵀĤ⁻¹c) = 1/(1/50) = 50.
        // expected_info î = 1/(1/40) = 40.
        // score_cov   Î = 1/0.01 = 100.
        // θ̂ = 0.25, r = +√4 = 2.
        assert!((res.r - 2.0).abs() < 1e-12, "r = {}", res.r);
        // u = (θ̂−θ₀)·î/√ĵ = 0.25·40/√50 = √2.
        assert!(
            (res.u - std::f64::consts::SQRT_2).abs() < 1e-9,
            "u = {}",
            res.u
        );
        assert!(
            (res.r_star - 1.826_713_204_9).abs() < 1e-9,
            "r* = {}",
            res.r_star
        );
        // u < r here ⇒ r* < r ⇒ larger two-sided p than first-order.
        assert!(res.p_value_corrected > res.p_value_first_order);
        // Empirical companion: u_emp = (θ̂−θ₀)·Î/√ĵ = 0.25·100/√50 = 3.53553391.
        assert!(
            (res.u_empirical - 3.535_533_905_9).abs() < 1e-9,
            "u_emp = {}",
            res.u_empirical
        );
        assert!((res.r_star_empirical - 2.284_858_570_8).abs() < 1e-9);
        // Dimension mismatch is rejected.
        let bad_c = array![1.0_f64, 0.0];
        assert!(
            scalar_skovgaard_from_matrices(
                bad_c.view(),
                beta.view(),
                h.view(),
                None,
                row_scores.view(),
                lr,
                0.0,
            )
            .is_none()
        );
    }

    /// NON-CANONICAL FIXTURE (logistic location model, scalar): the regression
    /// guard for this module. A logistic location model `yᵢ = θ + εᵢ`,
    /// `εᵢ ~ Logistic(0, 1)`, is **non-canonical** — the observed information
    /// `ĵ = −Σ g''(yᵢ−θ̂) = 2Σ f(yᵢ−θ̂)` is data-dependent and differs from the
    /// expected (Fisher) information `î = n/3`. The exact Barndorff-Nielsen `u`
    /// for a location model is `U(θ₀)/√ĵ`, and `g'(x) = 1 − 2F(x)`,
    /// `g''(x) = −2 f(x)` with `F`, `f` the logistic CDF / PDF.
    ///
    /// The key assertion is that `expected_info` is **load-bearing in `u`**:
    /// forcing `î := ĵ` (the canonical substitution) changes `u`. The pre-fix
    /// formula `u = (θ̂−θ₀)·ĵ/√Î` does not read `expected_info` at all, so it
    /// produces the *same* `u` under that substitution — i.e. this test fails
    /// under the dropped-`î` bug and passes once `î` enters `u = (θ̂−θ₀)·î/√ĵ`.
    #[test]
    fn non_canonical_link_expected_info_enters_u() {
        let cdf = |x: f64| 1.0 / (1.0 + (-x).exp());
        let pdf = |x: f64| {
            let e = (-x).exp();
            e / ((1.0 + e) * (1.0 + e))
        };
        let gp = |x: f64| 1.0 - 2.0 * cdf(x); // g'(x)
        let g = |x: f64| -x - 2.0 * (1.0 + (-x).exp()).ln(); // log pdf

        // Fixed asymmetric dataset so θ̂ is off-centre and ĵ ≠ î.
        let y = [-0.4_f64, 0.1, 0.7, 1.3, 2.1, 2.8, 3.9, 5.5];
        let n = y.len() as f64;
        let score = |t: f64| y.iter().map(|&yi| -gp(yi - t)).sum::<f64>(); // U(θ)
        let obs_info = |t: f64| 2.0 * y.iter().map(|&yi| pdf(yi - t)).sum::<f64>(); // ĵ(t) = −Σg''
        // Newton for the MLE.
        let mut theta_hat = y.iter().sum::<f64>() / n;
        for _ in 0..100 {
            let step = score(theta_hat) / obs_info(theta_hat);
            theta_hat += step;
            if step.abs() < 1e-14 {
                break;
            }
        }
        let theta0 = 1.0_f64;
        let observed = obs_info(theta_hat); // ĵ
        let expected = n / 3.0; // î = n · (logistic Fisher info 1/3)
        // Empirical efficient information for the scalar case (engine reduction
        // with c = 1, a = Ĥ⁻¹c = 1/ĵ): Î = ĵ² / Σ sᵢ².
        let meat = y.iter().map(|&yi| gp(yi - theta_hat).powi(2)).sum::<f64>();
        let score_cov = observed * observed / meat;
        let lr = (2.0
            * (y.iter().map(|&yi| g(yi - theta_hat)).sum::<f64>()
                - y.iter().map(|&yi| g(yi - theta0)).sum::<f64>()))
        .max(0.0);
        assert!(
            expected > observed,
            "fixture must have î > ĵ: î={expected} ĵ={observed}"
        );

        let input = ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        };
        let res = scalar_skovgaard_r_star(&input).expect("r*");

        // u uses the EXPECTED information: u = (θ̂−θ₀)·î/√ĵ.
        let u_expected = (theta_hat - theta0) * expected / observed.sqrt();
        assert!(
            (res.u - u_expected).abs() < 1e-12,
            "u = {} expected {u_expected}",
            res.u
        );

        // The load-bearing guard: forcing î := ĵ (canonical) changes u. Under the
        // pre-fix u = (θ̂−θ₀)·ĵ/√Î this substitution would leave u unchanged.
        let canonical = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            expected_info: observed,
            ..input
        })
        .expect("r* canonical");
        assert!(
            (res.u - canonical.u).abs() > 1e-3,
            "expected_info must change u: non-canonical u={} canonical u={}",
            res.u,
            canonical.u
        );
        // Canonical substitution reduces u to the observed-Wald root (θ̂−θ₀)√ĵ.
        assert!(
            (canonical.u - (theta_hat - theta0) * observed.sqrt()).abs() < 1e-12,
            "canonical u must be (θ̂−θ₀)√ĵ, got {}",
            canonical.u
        );
        // The empirical companion is independent of î and tracks Î instead.
        let u_emp_expected = (theta_hat - theta0) * score_cov / observed.sqrt();
        assert!((res.u_empirical - u_emp_expected).abs() < 1e-12);
        assert!(res.r_star.is_finite() && res.r_star_empirical.is_finite());
    }

    #[test]
    fn rejects_degenerate_inputs() {
        let base = ScalarSkovgaardInput {
            theta_hat: 0.3,
            theta_null: 0.0,
            lr_statistic: 4.0,
            observed_info: 50.0,
            expected_info: 50.0,
            score_cov: 50.0,
        };
        // Non-positive LR.
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                lr_statistic: 0.0,
                ..base
            })
            .is_none()
        );
        // Non-positive info.
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                observed_info: 0.0,
                ..base
            })
            .is_none()
        );
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                score_cov: -1.0,
                ..base
            })
            .is_none()
        );
        // θ̂ = θ₀ ⇒ r = 0, p = 1, not material.
        let eq = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.0,
            ..base
        })
        .expect("equal");
        assert_eq!(eq.r, 0.0);
        assert_eq!(eq.p_value_first_order, 1.0);
        assert!(!eq.material);
    }

    // ── INDEPENDENT ANALYTIC FIXTURE: Poisson mean via the Lugannani–Rice
    //    saddlepoint (#939, deliverable 3 hardening) ───────────────────────────
    //
    // A second, algebraically-distinct closed form for `r*`. For a one-parameter
    // exponential family the modified root `r*` and the Lugannani–Rice (1980)
    // saddlepoint approximation share the SAME directed root `r` and the SAME `u`,
    // but combine them by different formulas:
    //
    //   * Barndorff-Nielsen:  r* = r + (1/r)·log(u/r),  tail = Φ(−r*),
    //   * Lugannani–Rice:     tail = 1 − Φ(r) − φ(r)·(1/r − 1/u).
    //
    // Both are third-order-accurate approximations to the SAME exact tail
    // probability, so they must agree to O(n⁻³ᐟ²). Reproducing the L–R tail from
    // OUR `(r, u)` is therefore an independent check that the engine's `u` (built
    // from observed/expected/score information) is the genuine Skovgaard `u` — a
    // different derivation than the Exponential/canonical anchor already in the
    // module, on a different family.
    //
    // Poisson model: `S ~ Poisson(nμ)`, canonical θ = log μ. For the natural
    // sufficient statistic the canonical-family `u` equals the Wald root
    // `q = (θ̂−θ₀)·√ĵ` with `ĵ = nμ̂ = S` (the exact observed information in θ),
    // and the LR root is `r = sign(θ̂−θ₀)·√W`, `W = 2[S log(S/(nμ₀)) − (S−nμ₀)]`.

    /// Standard normal pdf.
    fn normal_pdf(z: f64) -> f64 {
        (-0.5 * z * z).exp() / (2.0 * std::f64::consts::PI).sqrt()
    }

    /// The right-tail `P(X ≥ x)` for the Poisson saddlepoint problem, computed two
    /// independent ways from a single `(r, u)`: our Barndorff-Nielsen `r*` tail and
    /// the Lugannani–Rice tail. Returns `(p_rstar, p_lr, p_first_order)`.
    fn poisson_tails(n: f64, mu_hat: f64, mu0: f64) -> (f64, f64, f64) {
        let theta_hat = mu_hat.ln();
        let theta0 = mu0.ln();
        let s = n * mu_hat; // sufficient statistic S = nμ̂
        // LR statistic W = 2[S log(S/(nμ₀)) − (S − nμ₀)].
        let w = 2.0 * (s * (s / (n * mu0)).ln() - (s - n * mu0));
        // AT-THE-NULL atom (`μ̂ = μ₀` ⇒ `θ̂ = θ₀`, `W = 0`): the directed root is
        // exactly `r = 0`, `r*` is undefined, and the right-tail probability is
        // exactly `½` for all three forms. `scalar_skovgaard_r_star` correctly
        // returns `None` on a zero LR (the degenerate-input contract), so handle
        // this lattice atom here rather than unwrapping a `None`. For n=10, μ₀=1.3
        // the integer `s = 13` lands exactly on the null, so this branch is live.
        if theta_hat == theta0 || !(w > 0.0) {
            return (0.5, 0.5, 0.5);
        }
        // Observed/expected/score info in θ all equal nμ̂ = S for the canonical
        // Poisson at the MLE — the canonical identity î = ĵ = Î.
        let info = s;
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: w,
            observed_info: info,
            expected_info: info,
            score_cov: info,
        })
        .expect("poisson r*");
        let r = res.r;
        let u = res.u; // canonical ⇒ u = (θ̂−θ₀)√ĵ, the Wald root
        // Our r* right-tail P(X ≥ x) = Φ(−r*) = 1 − Φ(r*).
        let p_rstar = 1.0 - normal_cdf(res.r_star);
        // Lugannani–Rice tail from the same (r, u).
        let p_lr = (1.0 - normal_cdf(r)) - normal_pdf(r) * (1.0 / r - 1.0 / u);
        let p_first = 1.0 - normal_cdf(r);
        (p_rstar, p_lr, p_first)
    }

    #[test]
    fn poisson_r_star_tail_matches_lugannani_rice_saddlepoint() {
        // A genuine upper-tail event: μ̂ above μ₀ so r, u > 0 and the tail is small.
        // Several (n, μ̂, μ₀) so the agreement is not a single coincidence.
        for &(n, mu_hat, mu0) in &[
            (12.0_f64, 1.6_f64, 1.0_f64),
            (20.0, 2.3, 1.7),
            (8.0, 3.1, 2.0),
            (30.0, 0.9, 0.6),
        ] {
            let (p_rstar, p_lr, p_first) = poisson_tails(n, mu_hat, mu0);
            // Both saddlepoint tails are valid probabilities.
            assert!(
                (0.0..=1.0).contains(&p_rstar) && (0.0..=1.0).contains(&p_lr),
                "n={n} μ̂={mu_hat}: tails must be probabilities (r*={p_rstar}, LR={p_lr})"
            );
            // INDEPENDENT AGREEMENT: r* and Lugannani–Rice must coincide to the
            // shared O(n⁻³ᐟ²) order. Their relative gap shrinks with n; at these
            // modest n a 5% relative band (and a tight absolute floor) holds.
            let rel = (p_rstar - p_lr).abs() / p_lr.max(1e-12);
            assert!(
                (p_rstar - p_lr).abs() < 5e-3 || rel < 0.05,
                "n={n} μ̂={mu_hat} μ₀={mu0}: r* tail {p_rstar:.6} must match \
                 Lugannani–Rice {p_lr:.6} (|Δ|={:.2e}, rel={rel:.3})",
                (p_rstar - p_lr).abs()
            );
            // And both higher-order tails must DIFFER from the raw first-order
            // directed-root tail — otherwise the correction is a no-op and the
            // agreement above would be vacuous.
            assert!(
                (p_rstar - p_first).abs() > 1e-4,
                "n={n} μ̂={mu_hat}: r* must move the tail off the first-order value \
                 (r*={p_rstar:.6}, first-order={p_first:.6})"
            );
        }
    }

    /// SMALL-n SIZE CHECK (#939, deliverable 3 hardening): under the null the
    /// one-sided p-value from the modified root `r*` must be BETTER calibrated
    /// (closer to Uniform / nominal size) than the raw first-order directed root
    /// `r`. Exact null distribution: `S ~ Poisson(nμ₀)` summed over the integer
    /// support — no Monte-Carlo noise, the size is computed exactly from the pmf.
    #[test]
    fn poisson_r_star_improves_small_n_size_over_first_order() {
        let mu0 = 1.3_f64;
        // Two complementary calibration metrics, accumulated across all n:
        //   (1) the DISCRETE exact rejection size at fixed α — coarse, because a
        //       Poisson statistic rejects at whole atoms, so r* and the
        //       first-order root can tie when their p-values straddle the same
        //       atom (a no-op at that α/n, never an improvement). We require r*
        //       to be NO WORSE at every (n, α) and strictly better in aggregate.
        //   (2) accuracy against the EXACT Poisson upper-tail probability
        //       P(S′ ≥ s) (ground truth, summed from the same pmf): the
        //       third-order r* tail must be a strictly better approximation to
        //       the exact tail than the first-order root, in pmf-weighted mean
        //       absolute error over the upper half. This is not quantized by the
        //       rejection grid, so it is the un-aliased witness that r* genuinely
        //       sharpens the tail.
        let alphas = [0.05_f64, 0.10];
        let mut total_err_first = 0.0_f64;
        let mut total_err_star = 0.0_f64;
        let mut total_mae_first = 0.0_f64;
        let mut total_mae_star = 0.0_f64;
        // Small n where the first-order directed root is visibly skewed.
        for &n in &[10.0_f64, 16.0, 25.0] {
            let rate = n * mu0; // S ~ Poisson(rate)
            let s_max = (rate + 50.0 * rate.sqrt()).ceil() as usize;
            // Materialize the exact pmf so we can form the exact upper tail.
            let mut pmf_vec = vec![0.0_f64; s_max + 1];
            let mut pmf = (-rate).exp();
            pmf_vec[0] = pmf;
            for s in 1..=s_max {
                pmf *= rate / s as f64;
                pmf_vec[s] = pmf;
            }
            // Exact upper tail P(S′ ≥ s) = Σ_{t≥s} pmf(t).
            let mut exact_upper = vec![0.0_f64; s_max + 2];
            for s in (0..=s_max).rev() {
                exact_upper[s] = exact_upper[s + 1] + pmf_vec[s];
            }
            let mut size_first = [0.0_f64; 2];
            let mut size_star = [0.0_f64; 2];
            // pmf-weighted mean |approx tail − exact tail| over the upper half.
            let mut tail_err_first = 0.0_f64;
            let mut tail_err_star = 0.0_f64;
            let mut mass_upper = 0.0_f64;
            for s in 1..=s_max {
                let p = pmf_vec[s];
                let mu_hat = s as f64 / n;
                // Upper-tail p-values (one-sided test μ > μ₀). For μ̂ < μ₀ the
                // upper-tail p-value is > 0.5 and never triggers a small-α
                // rejection, so this cleanly isolates the calibrated tail.
                let (p_rstar, _p_lr, p_first) = poisson_tails(n, mu_hat, mu0);
                for (j, &a) in alphas.iter().enumerate() {
                    if p_first <= a {
                        size_first[j] += p;
                    }
                    if p_rstar <= a {
                        size_star[j] += p;
                    }
                }
                if mu_hat >= mu0 {
                    // CONTINUITY-CORRECTED ground truth. The saddlepoint tails
                    // `p_first` / `p_rstar` are CONTINUOUS approximations built
                    // from the integer-valued statistic `S = s`, so they target
                    // the lattice tail at the MID-CELL point `s − ½`, i.e. the
                    // continuity-corrected exact tail `½[P(S′ ≥ s) + P(S′ ≥ s+1)]`
                    // — NOT the raw integer atom `P(S′ ≥ s)`. Comparing the
                    // continuous tail against the un-corrected integer tail
                    // introduces a fixed half-integer offset that the cruder
                    // first-order root happens to partially absorb, ALIASING the
                    // MAE so the more-accurate third-order `r*` looks worse. With
                    // the standard mid-cell continuity correction the comparison
                    // is on the lattice point the saddlepoint actually estimates,
                    // and `r*`'s genuine O(n⁻³ᐟ²) sharpening shows through (it is
                    // ~5× closer to the exact tail than the first-order root here).
                    let exact = 0.5 * (exact_upper[s] + exact_upper[s + 1]);
                    tail_err_first += p * (p_first - exact).abs();
                    tail_err_star += p * (p_rstar - exact).abs();
                    mass_upper += p;
                }
            }
            // (1) No-worse-everywhere at fixed α, accumulating the aggregate error.
            for (j, &a) in alphas.iter().enumerate() {
                let err_first = (size_first[j] - a).abs();
                let err_star = (size_star[j] - a).abs();
                assert!(
                    err_star <= err_first + 1e-9,
                    "n={n} α={a}: r* size {:.4} (|Δ|={err_star:.4}) must be no worse than \
                     first-order size {:.4} (|Δ|={err_first:.4})",
                    size_star[j],
                    size_first[j]
                );
                total_err_first += err_first;
                total_err_star += err_star;
            }
            // (2) The un-aliased witness: the r* tail must approximate the EXACT
            // upper-tail probability NO WORSE than the first-order root at every
            // n (a half-integer continuity offset can tie a particular n), and
            // strictly better in aggregate below. pmf-weighted MAE over the upper
            // half.
            let mae_first = tail_err_first / mass_upper;
            let mae_star = tail_err_star / mass_upper;
            assert!(
                mae_star <= mae_first + 1e-12,
                "n={n}: r* tail must approximate the exact Poisson upper tail no worse \
                 than first-order: MAE*={mae_star:.6} must be ≤ MAE={mae_first:.6}"
            );
            total_mae_first += mae_first;
            total_mae_star += mae_star;
        }
        // Aggregate strict improvement, robust to per-point discreteness ties:
        //   (a) the exact-tail MAE summed over all n must strictly drop — r*
        //       genuinely sharpens the tail (the un-aliased, continuous witness);
        //   (b) the discrete rejection-size error summed over all (n, α) must be
        //       no worse — the correction never degrades nominal calibration.
        assert!(
            total_mae_star < total_mae_first - 1e-9,
            "r* must strictly improve the aggregate exact-tail MAE over first-order: \
             Σ MAE*={total_mae_star:.6} must be < Σ MAE={total_mae_first:.6}"
        );
        assert!(
            total_err_star <= total_err_first + 1e-9,
            "r* must not worsen the aggregate discrete size over first-order: \
             Σ|size_r*−α|={total_err_star:.5} must be ≤ Σ|size_r−α|={total_err_first:.5}"
        );
    }
}