gam 0.3.125

Generalized penalized likelihood engine
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
124
125
126
127
128
129
130
131
132
133
134
135
136
137
138
139
140
141
142
143
144
145
146
147
148
149
150
151
152
153
154
155
156
157
158
159
160
161
162
163
164
165
166
167
168
169
170
171
172
173
174
175
176
177
178
179
180
181
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
207
208
209
210
211
212
213
214
215
216
217
218
219
220
221
222
223
224
225
226
227
228
229
230
231
232
233
234
235
236
237
238
239
240
241
242
243
244
245
246
247
248
249
250
251
252
253
254
255
256
257
258
259
260
261
262
263
264
265
266
267
268
269
270
271
272
273
274
275
276
277
278
279
280
281
282
283
284
285
286
287
288
289
290
291
292
293
294
295
296
297
298
299
300
301
302
303
304
305
306
307
308
309
310
311
312
313
314
315
316
317
318
319
320
321
322
323
324
325
326
327
328
329
330
331
332
333
334
335
336
337
338
339
340
341
342
343
344
345
346
347
348
349
350
351
352
353
354
355
356
357
358
359
360
361
362
363
364
365
366
367
368
369
370
371
372
373
374
375
376
377
378
379
380
381
382
383
384
385
386
387
388
389
390
391
392
393
394
395
396
397
398
399
400
401
402
403
404
405
406
407
408
409
410
411
412
413
414
415
416
417
418
419
420
421
422
423
424
425
426
427
428
429
430
431
432
433
434
435
436
437
438
439
440
441
442
443
444
445
446
447
448
449
450
451
452
453
454
455
456
457
458
459
460
461
462
463
464
465
466
467
468
469
470
471
472
473
474
475
476
477
478
479
480
481
482
483
484
485
486
487
488
489
490
491
492
493
494
495
496
497
498
499
500
501
502
503
504
505
506
507
508
509
510
511
512
513
514
515
516
517
518
519
520
521
522
523
524
525
526
527
528
529
530
531
532
533
534
535
536
537
538
539
540
541
542
543
544
545
546
547
548
549
550
551
552
553
554
555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
577
578
579
580
581
582
583
584
585
586
587
588
589
590
591
592
593
594
595
596
597
598
599
600
601
602
603
604
605
606
607
608
609
610
611
612
613
614
615
616
617
618
619
620
621
622
623
624
625
626
627
628
629
630
631
632
633
634
635
636
637
638
639
640
641
642
643
644
645
646
647
648
649
650
651
652
653
654
655
656
657
658
659
660
661
662
663
664
665
666
667
668
669
670
671
672
673
674
675
676
677
678
679
680
681
682
683
684
685
686
687
688
689
690
691
692
693
694
695
696
697
698
699
700
701
702
703
704
705
706
707
708
709
710
711
712
713
714
715
716
717
718
719
720
721
722
723
724
725
726
727
728
729
730
731
732
733
734
735
736
737
738
739
740
741
742
743
744
745
746
747
748
749
750
751
752
753
754
755
756
757
758
759
760
761
762
763
764
765
766
767
768
769
770
771
772
773
774
775
776
777
778
779
780
781
782
783
784
785
786
787
788
789
790
791
792
793
794
795
796
797
798
799
800
801
802
803
804
805
806
807
808
809
810
811
812
813
814
815
816
817
818
819
820
821
822
823
824
825
826
827
828
829
830
831
832
833
834
835
836
837
838
839
840
841
842
843
844
845
846
847
848
849
850
851
852
853
854
855
856
857
858
859
860
861
862
863
864
865
866
867
868
869
870
871
872
873
874
875
876
877
878
879
880
881
882
883
884
885
886
887
888
889
890
891
892
893
894
895
896
897
898
899
900
901
902
903
904
905
906
907
908
909
910
911
912
913
914
915
916
917
918
919
920
921
922
923
924
925
926
927
928
929
930
931
932
933
934
935
936
937
938
939
940
941
942
943
944
945
946
947
948
949
950
951
952
953
954
955
956
957
958
959
960
961
962
963
964
965
966
967
968
969
970
971
972
973
//! Skovgaard's modified directed likelihood root `r*` for a **scalar** interest
//! parameter (issue #939, deliverable 3).
//!
//! For a scalar functional `ψ = cᵀβ` tested against `ψ₀` (e.g. "is the smooth
//! zero at `x₀`", a point-on-curve or a contrast), the first-order signed root
//! of the (profile) likelihood-ratio statistic
//!
//! ```text
//! r = sign(ψ̂ − ψ₀) · √( 2 [ ℓ(ψ̂) − ℓ(ψ₀) ] )
//! ```
//!
//! is `N(0,1)` only to `O(n⁻¹ᐟ²)`. **Barndorff-Nielsen's modified root**
//!
//! ```text
//! r* = r + (1/r) · log( u / r )
//! ```
//!
//! is `N(0,1)` to `O(n⁻³ᐟ²)` — third-order accurate. The hard ingredient is the
//! Skovgaard (1996) sample-space-derivative approximation to `u`. For a scalar
//! interest parameter this assembles entirely from quantities the engine already
//! maintains: the **observed** information `ĵ` (the penalized Hessian / true
//! second derivative at the optimum), the **expected** information `î` (the
//! Fisher weights every family computes for PIRLS), and the score covariance
//! (the per-row score outer product). No new theory and no sample-space
//! quadrature are needed — it is assembly, per the issue's Stage-1 plan.
//!
//! # The scalar Skovgaard `u`
//!
//! For a scalar parameter with no nuisance, Barndorff-Nielsen's exact `u` is the
//! **sample-space derivative** of the log-likelihood, normalised by the observed
//! information at the MLE:
//!
//! ```text
//! u = ĵ^{-1/2} · { ℓ_{;θ̂}(θ̂) − ℓ_{;θ̂}(θ₀) },     ĵ = −ℓ''(θ̂).
//! ```
//!
//! The sample-space derivative `ℓ_{;θ̂}` is generally intractable (it needs an
//! ancillary). **Skovgaard's (1996) approximation** replaces that derivative
//! difference with a covariance of likelihood quantities computed under the
//! fitted model (Skovgaard 1996, *Bernoulli* 2:145–165; Severini, *Likelihood
//! Methods in Statistics*, 2000, §7.5):
//!
//! ```text
//! ℓ_{;θ̂}(θ̂) − ℓ_{;θ̂}(θ₀)  ≈  q̃ := cov_θ̂[ U(θ̂), ℓ(θ̂) − ℓ(θ₀) ],
//! ```
//!
//! which is **exact** for a full exponential family and `O(n⁻¹)`-accurate in
//! general. Expanding `q̃` about the MLE, its leading term is
//! `q̃ ≈ (θ̂ − θ₀) · var_θ̂[U(θ̂)]`, and `var[U]` is precisely the information
//! the model supplies. Writing the score `U(θ) = ℓ'(θ) = Σᵢ s_i(θ)`,
//!
//! * `ĵ = −ℓ''(θ̂)` — the **observed** information at the MLE (the penalized
//!   Hessian; the Barndorff-Nielsen normaliser `ĵ^{-1/2}`),
//! * `î = E[−ℓ''] = var[U]` — the **expected** (Fisher) information (the Fisher
//!   weights every family computes for PIRLS; the score variance that enters
//!   `q̃`),
//! * `Î` — the empirical **score (outer-product) covariance** information, the
//!   data-based (robust / sandwich) estimate of the same `var[U]`; for a single
//!   scalar score it is `Σᵢ s_i(θ̂)²`, and for a functional `ψ = cᵀβ` it is the
//!   sandwich reduction `(cᵀ Ĥ⁻¹ (Σᵢ sᵢsᵢᵀ) Ĥ⁻¹ c)⁻¹`.
//!
//! The scalar Skovgaard statistic is therefore
//!
//! ```text
//! u = (θ̂ − θ₀) · î / √ĵ           (model / Fisher form, the primary r*),
//! ```
//!
//! the observed-information Wald root `(θ̂ − θ₀)√ĵ` rescaled by the
//! **expected/observed information ratio `î/ĵ`** — the curvature correction that
//! the first-order root ignores. For a **canonical** link `î = ĵ` and the factor
//! is `1`; for a **non-canonical** link `î ≠ ĵ` and the correction is genuinely
//! applied (this is the whole point — it is silently lost if `î` is dropped).
//! Replacing the model variance `î` by its empirical estimate `Î` gives the
//! **Severini empirical** companion `u_emp = (θ̂ − θ₀) · Î / √ĵ`; the two agree
//! to `O(n⁻¹)` under correct specification and diverge under misspecification, so
//! reporting both is a model-adequacy diagnostic. In the regular case
//! `î = ĵ = Î`, both collapse to `u = (θ̂ − θ₀)√ĵ → r`, so `r* → r`.
//!
//! # Certification anchor
//!
//! The unit-rate / general-rate **Exponential** model has every ingredient in
//! closed form, so `r*` is checkable against a direct evaluation: `y_i ~ Exp(θ)`,
//! `ℓ(θ) = n log θ − θ Σy`, `θ̂ = n / Σy`, `ĵ = n/θ̂²`, `î = n/θ²`, and the
//! score covariance `Î = n/θ²` at the true `θ`. Because the family is canonical
//! `î = ĵ = Î` and `u` reduces to `(θ̂ − θ₀)√ĵ`; the fixture verifies `r*`
//! moves the directed root toward its `N(0,1)` calibration and reduces to `r`
//! in the large-`n` limit. The **non-canonical** companion fixture
//! (`non_canonical_link_expected_info_enters_u`) pins `î ≠ ĵ` and asserts the
//! `î/ĵ` factor changes `u` — the regression guard for this module.

/// The ingredients of the scalar Skovgaard `r*`, all evaluated for a single
/// scalar interest parameter `θ` (the functional `ψ = cᵀβ` after profiling out
/// the nuisance coefficients).
///
/// Every field is a quantity the fitted model already exposes; this struct is a
/// pure data carrier so the assembly is testable in isolation against the
/// closed-form fixtures.
#[derive(Debug, Clone, Copy)]
pub struct ScalarSkovgaardInput {
    /// The interest parameter estimate `θ̂` (e.g. `ψ̂ = cᵀβ̂`).
    pub theta_hat: f64,
    /// The tested null value `θ₀` (e.g. `ψ₀`, often `0` for "smooth is zero").
    pub theta_null: f64,
    /// The profile log-likelihood-ratio statistic
    /// `W = 2[ℓ(θ̂) − ℓ(θ₀)] ≥ 0` (from a constrained refit at `cᵀβ = θ₀`).
    pub lr_statistic: f64,
    /// Observed information `ĵ` for the interest parameter at the optimum: the
    /// scalar reduction `(cᵀ Ĥ⁻¹ c)⁻¹` of the penalized Hessian `Ĥ`, i.e. the
    /// inverse of the profile variance of `θ̂`.
    pub observed_info: f64,
    /// Expected (Fisher) information `î` for the interest parameter — the same
    /// reduction using the Fisher-weight information `Iₑ` the family supplies to
    /// PIRLS: `(cᵀ Iₑ⁻¹ c)⁻¹`.
    pub expected_info: f64,
    /// Score (outer-product) covariance `Î` for the interest parameter: the
    /// reduction `(cᵀ Ĥ⁻¹ (Σᵢ sᵢsᵢᵀ) Ĥ⁻¹ c)` evaluated with the per-row score
    /// contributions `sᵢ = ∂ℓᵢ/∂β`, inverted to the parameter scale. The
    /// "robust"/empirical information.
    pub score_cov: f64,
}

/// The Skovgaard `r*` report for a scalar test.
#[derive(Debug, Clone, Copy)]
pub struct ScalarSkovgaardResult {
    /// The first-order directed likelihood root `r = sign(θ̂−θ₀)·√W`.
    pub r: f64,
    /// Skovgaard's `u` quantity, model/Fisher form `u = (θ̂−θ₀)·î/√ĵ`.
    pub u: f64,
    /// The modified directed root `r* = r + log(u/r)/r` (model/Fisher form).
    pub r_star: f64,
    /// First-order two-sided p-value `2·Φ(−|r|)`.
    pub p_value_first_order: f64,
    /// Third-order two-sided p-value `2·Φ(−|r*|)` (model/Fisher form).
    pub p_value_corrected: f64,
    /// The Severini empirical companion `u_emp = (θ̂−θ₀)·Î/√ĵ`, using the
    /// empirical score covariance `Î` in place of the model Fisher information
    /// `î`. Equals [`Self::u`] when `î = Î`.
    pub u_empirical: f64,
    /// The empirical modified root `r* = r + log(u_emp/r)/r`. Falls back to `r`
    /// when the empirical log-domain guard fails, exactly as the model form.
    pub r_star_empirical: f64,
    /// Two-sided p-value `2·Φ(−|r*_emp|)` of the empirical companion.
    pub p_value_corrected_empirical: f64,
    /// Whether the `r*` correction is **material** (>10% relative change in the
    /// p-value, or `|r* − r| > 0.1·|r|`): the per-test diagnostic that the
    /// sample is too small for first-order inference here (#939 deliverable 4).
    pub material: bool,
}

/// Standard normal CDF `Φ`.
fn normal_cdf(z: f64) -> f64 {
    0.5 * statrs::function::erf::erfc(-z / std::f64::consts::SQRT_2)
}

/// Two-sided normal-tail p-value `2·Φ(−|z|)`.
fn two_sided_p(z: f64) -> f64 {
    (2.0 * normal_cdf(-z.abs())).clamp(0.0, 1.0)
}

/// The materiality threshold (#939 deliverable 4): a correction is material when
/// it moves the result by more than 10%.
pub const SKOVGAARD_MATERIAL_THRESHOLD: f64 = 0.10;

/// Assemble the scalar Skovgaard `r*` from its ingredients.
///
/// Returns `None` when the inputs are degenerate: a non-positive LR statistic
/// (the directed root is undefined at `r = 0`), a non-finite or non-positive
/// information, or a non-finite `r*` (e.g. `u/r ≤ 0`, where the third-order
/// formula does not apply and the first-order root stands). The caller then
/// reports the first-order `r` only — the correction is never forced.
pub fn scalar_skovgaard_r_star(input: &ScalarSkovgaardInput) -> Option<ScalarSkovgaardResult> {
    let ScalarSkovgaardInput {
        theta_hat,
        theta_null,
        lr_statistic,
        observed_info,
        expected_info,
        score_cov,
    } = *input;

    if !(lr_statistic.is_finite() && lr_statistic > 0.0) {
        return None;
    }
    if !(observed_info.is_finite() && observed_info > 0.0) {
        return None;
    }
    if !(expected_info.is_finite() && expected_info > 0.0) {
        return None;
    }
    if !(score_cov.is_finite() && score_cov > 0.0) {
        return None;
    }
    if !(theta_hat.is_finite() && theta_null.is_finite()) {
        return None;
    }

    // θ̂ = θ₀ ⇒ the directed root is exactly `r = 0`: no side, no correction.
    // NOTE: `f64::signum` returns `±1.0` even for `±0.0` (it never returns `0.0`),
    // so the equality case MUST be detected directly from `θ̂ − θ₀ == 0` rather
    // than from `sign == 0.0` — the latter is unreachable and would let an
    // on-the-null input fall through to `r = √W ≠ 0`.
    if theta_hat == theta_null {
        return Some(ScalarSkovgaardResult {
            r: 0.0,
            u: 0.0,
            r_star: 0.0,
            p_value_first_order: 1.0,
            p_value_corrected: 1.0,
            u_empirical: 0.0,
            r_star_empirical: 0.0,
            p_value_corrected_empirical: 1.0,
            material: false,
        });
    }
    // First-order directed root: sign from the estimate's side of the null, mag
    // from the LR statistic. `θ̂ ≠ θ₀` here, so `sign ∈ {−1, +1}`.
    let sign = (theta_hat - theta_null).signum();
    let p_first = two_sided_p(sign * lr_statistic.sqrt());
    let r = sign * lr_statistic.sqrt();

    // Barndorff-Nielsen's `u = ĵ^{-1/2}·{SSD}` with Skovgaard's covariance
    // approximation to the sample-space-derivative difference (see the module
    // header): `SSD ≈ q̃ ≈ (θ̂−θ₀)·var[U]`, so the score-variance information
    // `var[U]` enters the numerator and the observed information `ĵ` is the
    // Barndorff-Nielsen normaliser `ĵ^{-1/2}`:
    //
    //   u     = (θ̂ − θ₀) · î / √ĵ      (model / Fisher var[U] = î)
    //   u_emp = (θ̂ − θ₀) · Î / √ĵ      (Severini empirical var[U] = Î).
    //
    // The expected/observed ratio `î/ĵ` is the curvature correction that the
    // first-order root drops; it is `1` for a canonical link and `≠ 1` for a
    // non-canonical one. In the regular case `î = ĵ = Î` both collapse to
    // `(θ̂ − θ₀)√ĵ → r`.
    let dtheta = theta_hat - theta_null;
    let sqrt_obs = observed_info.sqrt();
    let u = dtheta * expected_info / sqrt_obs;
    let u_empirical = dtheta * score_cov / sqrt_obs;

    // Barndorff-Nielsen modification `r* = r + log(u/r)/r`, guarding the
    // log-domain (`u` and `r` must share a sign and `u/r > 0`): when the
    // third-order formula does not apply the first-order root stands.
    let modified_root = |u_val: f64| -> f64 {
        let ratio = u_val / r;
        if !(ratio.is_finite() && ratio > 0.0) {
            return r;
        }
        let rs = r + ratio.ln() / r;
        if rs.is_finite() { rs } else { r }
    };
    let r_star = modified_root(u);
    let r_star_empirical = modified_root(u_empirical);

    let p_corr = two_sided_p(r_star);
    let p_corr_empirical = two_sided_p(r_star_empirical);
    let p_denom = p_first.max(p_corr).max(f64::MIN_POSITIVE);
    let p_move = (p_corr - p_first).abs() / p_denom;
    let r_move = (r_star - r).abs() / r.abs().max(f64::MIN_POSITIVE);
    let material = p_move > SKOVGAARD_MATERIAL_THRESHOLD || r_move > SKOVGAARD_MATERIAL_THRESHOLD;

    Some(ScalarSkovgaardResult {
        r,
        u,
        r_star,
        p_value_first_order: p_first,
        p_value_corrected: p_corr,
        u_empirical,
        r_star_empirical,
        p_value_corrected_empirical: p_corr_empirical,
        material,
    })
}

/// Assemble [`ScalarSkovgaardInput`] for a scalar functional `ψ = cᵀβ` from the
/// matrix-level ingredients a fitted penalized GLM exposes, then compute `r*`.
///
/// * `contrast` (`c`) — the functional gradient `∂ψ/∂β`: a design row for a
///   point-on-curve `m(x₀)`, the difference of two rows for a contrast, or any
///   linear functional gradient.
/// * `beta` — fitted coefficients `β̂`.
/// * `penalized_hessian` (`Ĥ = X'WX + S_λ`) — the **observed** information in
///   coefficient space (the engine's penalized Hessian / true second
///   derivative).
/// * `fisher_information` (`Iₑ = X'WX`) — the **expected** (Fisher) information
///   in coefficient space (the PIRLS Fisher weights; pass `None` to reuse the
///   penalized Hessian when the family is canonical and the distinction
///   vanishes).
/// * `row_scores` (`sᵢ = ∂ℓᵢ/∂β`, `n × p`) — per-row score contributions for the
///   score (outer-product) covariance `Σᵢ sᵢsᵢᵀ`.
/// * `lr_statistic` (`W = 2[ℓ(β̂) − ℓ(β̂₀)]`) — the profile likelihood-ratio
///   statistic from a constrained refit at `cᵀβ = θ₀` (caller-supplied; the
///   constrained-fit machinery lives in the KKT path).
/// * `theta_null` (`θ₀`) — the tested value (commonly `0`).
///
/// The scalar reductions are the standard profile/marginal identities:
/// `observed_info = (cᵀ Ĥ⁻¹ c)⁻¹`, `expected_info = (cᵀ Iₑ⁻¹ c)⁻¹`, and
/// `score_cov = (cᵀ Ĥ⁻¹ (Σ sᵢsᵢᵀ) Ĥ⁻¹ c)⁻¹` — the inverse of the sandwich
/// (robust) variance of `ψ̂`. Returns `None` on any degenerate reduction.
pub fn scalar_skovgaard_from_matrices(
    contrast: ndarray::ArrayView1<'_, f64>,
    beta: ndarray::ArrayView1<'_, f64>,
    penalized_hessian: ndarray::ArrayView2<'_, f64>,
    fisher_information: Option<ndarray::ArrayView2<'_, f64>>,
    row_scores: ndarray::ArrayView2<'_, f64>,
    lr_statistic: f64,
    theta_null: f64,
) -> Option<ScalarSkovgaardResult> {
    use crate::faer_ndarray::FaerCholesky;
    use faer::Side;

    let p = beta.len();
    if p == 0
        || contrast.len() != p
        || penalized_hessian.nrows() != p
        || penalized_hessian.ncols() != p
        || row_scores.ncols() != p
    {
        return None;
    }
    if contrast.iter().any(|v| !v.is_finite()) || beta.iter().any(|v| !v.is_finite()) {
        return None;
    }

    let theta_hat = contrast.dot(&beta);

    // Ĥ⁻¹ c via the penalized-Hessian Cholesky.
    let h_obs = penalized_hessian.to_owned();
    let chol_obs = h_obs.cholesky(Side::Lower).ok()?;
    let c_owned = contrast.to_owned();
    let hinv_c = chol_obs.solvevec(&c_owned);
    if hinv_c.iter().any(|v| !v.is_finite()) {
        return None;
    }
    // Profile variance of ψ̂ under the penalized fit: cᵀ Ĥ⁻¹ c. Observed info is
    // its inverse.
    let var_obs = contrast.dot(&hinv_c);
    if !(var_obs.is_finite() && var_obs > 0.0) {
        return None;
    }
    let observed_info = 1.0 / var_obs;

    // Expected info: same reduction with the Fisher information; default to the
    // penalized Hessian when the family/link is canonical (no distinction).
    let expected_info = match fisher_information {
        Some(fisher) => {
            if fisher.nrows() != p || fisher.ncols() != p {
                return None;
            }
            let f_owned = fisher.to_owned();
            let chol_f = f_owned.cholesky(Side::Lower).ok()?;
            let finv_c = chol_f.solvevec(&c_owned);
            let var_exp = contrast.dot(&finv_c);
            if !(var_exp.is_finite() && var_exp > 0.0) {
                return None;
            }
            1.0 / var_exp
        }
        None => observed_info,
    };

    // Score (outer-product) covariance in parameter space: the sandwich variance
    // cᵀ Ĥ⁻¹ (Σ sᵢsᵢᵀ) Ĥ⁻¹ c, inverted. With a = Ĥ⁻¹ c this is Σᵢ (sᵢᵀ a)².
    let mut sandwich = 0.0;
    for srow in row_scores.rows() {
        if srow.iter().any(|v| !v.is_finite()) {
            return None;
        }
        let proj = srow.dot(&hinv_c);
        sandwich += proj * proj;
    }
    if !(sandwich.is_finite() && sandwich > 0.0) {
        return None;
    }
    let score_cov = 1.0 / sandwich;

    scalar_skovgaard_r_star(&ScalarSkovgaardInput {
        theta_hat,
        theta_null,
        lr_statistic,
        observed_info,
        expected_info,
        score_cov,
    })
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn regular_case_collapses_to_first_order() {
        // î = ĵ = Î (regular, large-n limit): u = (θ̂−θ₀)·î/√ĵ = (θ̂−θ₀)√ĵ ≈ r,
        // so r* = r. Take a model with info = 100, θ̂−θ₀ = 0.3 ⇒ Wald² = 9, and
        // the LR statistic equals the Wald square to leading order.
        let info = 100.0;
        let dtheta = 0.3;
        let lr = dtheta * dtheta * info; // 9.0
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.3,
            theta_null: 0.0,
            lr_statistic: lr,
            observed_info: info,
            expected_info: info,
            score_cov: info,
        })
        .expect("r*");
        // r = +3, u = (0.3)·100/10 = 3, ratio = 1, log(1)/3 = 0 ⇒ r* = r.
        assert!((res.r - 3.0).abs() < 1e-12, "r = {}", res.r);
        assert!((res.u - 3.0).abs() < 1e-12, "u = {}", res.u);
        assert!((res.r_star - res.r).abs() < 1e-12, "r* = {}", res.r_star);
        // The empirical companion uses the same î = ĵ = Î ⇒ identical to u.
        assert!(
            (res.u_empirical - res.u).abs() < 1e-12,
            "u_emp = {}",
            res.u_empirical
        );
        assert!((res.r_star_empirical - res.r_star).abs() < 1e-12);
        assert!(!res.material, "regular case must not be material");
    }

    #[test]
    fn expected_observed_ratio_shifts_r_star_and_p() {
        // The whole point of the fix: the expected/observed information ratio
        // î/ĵ drives u. With î > ĵ (expected information larger than observed —
        // a non-canonical-link signature), u > r and r* > r (a larger root,
        // smaller p-value). The empirical companion uses Î independently.
        let dtheta = 0.2;
        let observed = 100.0; // ĵ
        let expected = 196.0; // î > ĵ ⇒ î/ĵ = 1.96 correction
        let score_cov = 121.0; // Î (drives the empirical companion only)
        let lr = dtheta * dtheta * observed; // 4.0, r = 2.0
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.2,
            theta_null: 0.0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        })
        .expect("r*");
        assert!((res.r - 2.0).abs() < 1e-12);
        // u = 0.2·196/√100 = 3.92, ratio = 1.96, r* = 2 + ln(1.96)/2.
        let expected_u = dtheta * expected / observed.sqrt();
        assert!((res.u - expected_u).abs() < 1e-12, "u = {}", res.u);
        assert!(
            (res.r_star - 2.336_472_236_6).abs() < 1e-9,
            "r* = {}",
            res.r_star
        );
        assert!(res.r_star > res.r, "î > ĵ must lift r*");
        assert!(
            res.p_value_corrected < res.p_value_first_order,
            "larger root ⇒ smaller two-sided p"
        );
        assert!(
            res.material,
            "96% information discrepancy must flag material"
        );
        // Empirical companion: u_emp = 0.2·121/10 = 2.42, independent of î.
        assert!((res.u_empirical - dtheta * score_cov / observed.sqrt()).abs() < 1e-12);
        assert!((res.r_star_empirical - 2.095_310_179_8).abs() < 1e-9);
    }

    /// CONJUGATE FIXTURE (Exponential rate, scalar): every Skovgaard ingredient
    /// is closed form. `yᵢ ~ Exp(θ)`, `ℓ(θ) = n log θ − θ Σy`,
    /// `θ̂ = n/Σy`. At the data-generating `θ = 1` with `n` rows and the MLE
    /// `θ̂`, the observed and expected informations are `n/θ̂²` and `n/θ²`, and
    /// the score covariance at `θ̂` is `n/θ̂²` (the score variance equals the
    /// observed information for this canonical family). The directed root, `u`,
    /// and `r*` are then exactly computable; the test asserts the formula
    /// reproduces them and that `r*` is closer to its normal calibration than
    /// the skewed first-order `r`.
    #[test]
    fn exponential_rate_scalar_skovgaard_closed_form() {
        // Fix a concrete sufficient statistic: n = 25 rows, Σy = 20 ⇒ θ̂ = 1.25,
        // test θ₀ = 1.0.
        let n = 25.0_f64;
        let sum_y = 20.0_f64;
        let theta_hat = n / sum_y; // 1.25
        let theta0 = 1.0_f64;
        // ℓ(θ) = n ln θ − θ Σy.
        let ll = |t: f64| n * t.ln() - t * sum_y;
        let lr = (2.0 * (ll(theta_hat) - ll(theta0))).max(0.0);
        // Observed info at θ̂: −ℓ''(θ) = n/θ². ĵ = n/θ̂².
        let observed = n / (theta_hat * theta_hat);
        // Expected info at θ̂ (Fisher) = n/θ̂² for this family at the MLE.
        let expected = n / (theta_hat * theta_hat);
        // Score covariance at θ̂: var(ℓ') = n/θ̂² (the canonical identity).
        let score_cov = n / (theta_hat * theta_hat);
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        })
        .expect("r*");
        // Closed-form directed root.
        let r_expected = (theta_hat - theta0).signum() * lr.sqrt();
        assert!((res.r - r_expected).abs() < 1e-12, "r = {}", res.r);
        // u = (θ̂−θ₀)·î/√ĵ; here î = ĵ so u = (θ̂−θ₀)·√ĵ.
        let u_expected = (theta_hat - theta0) * expected / observed.sqrt();
        assert!((res.u - u_expected).abs() < 1e-12, "u = {}", res.u);
        // Canonical family ⇒ the empirical companion coincides with the model u.
        assert!(
            (res.u_empirical - res.u).abs() < 1e-12,
            "u_emp = {}",
            res.u_empirical
        );
        // r* finite and on the same side as r.
        assert!(res.r_star.is_finite());
        assert!(res.r_star.signum() == res.r.signum());
        // Canonical identity: u = q = (θ̂−θ₀)√ĵ, the Wald root (î = ĵ here). For
        // the right-skewed exponential LR the directed root r overstates the
        // Wald root, and the higher-order r* lies strictly between the Wald root
        // and r — the refinement that pulls the skewed first-order root back.
        let q = (theta_hat - theta0) * observed.sqrt();
        assert!(
            (res.u - q).abs() < 1e-12,
            "u = {} should equal Wald root q = {q}",
            res.u
        );
        assert!(
            q < res.r_star && res.r_star < r_expected,
            "need q < r* < r: q={q} r*={} r={r_expected}",
            res.r_star
        );
        // Both p-values are valid probabilities, the corrected one finite.
        assert!((0.0..=1.0).contains(&res.p_value_first_order));
        assert!((0.0..=1.0).contains(&res.p_value_corrected));
    }

    #[test]
    fn matrix_assembler_reduces_diagonal_case() {
        use ndarray::{Array2, array};
        // p = 1 (a scalar coefficient β with contrast c = [1]). Penalized
        // Hessian = [[50]], Fisher = [[40]], two score rows summing to a known
        // outer product. β̂ = [0.25], θ₀ = 0.
        let contrast = array![1.0_f64];
        let beta = array![0.25_f64];
        let h = Array2::from_shape_vec((1, 1), vec![50.0]).unwrap();
        let fisher = Array2::from_shape_vec((1, 1), vec![40.0]).unwrap();
        // Two rows with scores 3.0 and 4.0 ⇒ Σ sᵢ² = 25; a = Ĥ⁻¹c = 1/50.
        // sandwich = Σ (sᵢ·a)² = 25/2500 = 0.01 ⇒ score_cov = 100.
        let row_scores = Array2::from_shape_vec((2, 1), vec![3.0, 4.0]).unwrap();
        let lr = 4.0;
        let res = scalar_skovgaard_from_matrices(
            contrast.view(),
            beta.view(),
            h.view(),
            Some(fisher.view()),
            row_scores.view(),
            lr,
            0.0,
        )
        .expect("assembled r*");
        // observed_info ĵ = 1/(cᵀĤ⁻¹c) = 1/(1/50) = 50.
        // expected_info î = 1/(1/40) = 40.
        // score_cov   Î = 1/0.01 = 100.
        // θ̂ = 0.25, r = +√4 = 2.
        assert!((res.r - 2.0).abs() < 1e-12, "r = {}", res.r);
        // u = (θ̂−θ₀)·î/√ĵ = 0.25·40/√50 = √2.
        assert!(
            (res.u - std::f64::consts::SQRT_2).abs() < 1e-9,
            "u = {}",
            res.u
        );
        assert!(
            (res.r_star - 1.826_713_204_9).abs() < 1e-9,
            "r* = {}",
            res.r_star
        );
        // u < r here ⇒ r* < r ⇒ larger two-sided p than first-order.
        assert!(res.p_value_corrected > res.p_value_first_order);
        // Empirical companion: u_emp = (θ̂−θ₀)·Î/√ĵ = 0.25·100/√50 = 3.53553391.
        assert!(
            (res.u_empirical - 3.535_533_905_9).abs() < 1e-9,
            "u_emp = {}",
            res.u_empirical
        );
        assert!((res.r_star_empirical - 2.284_858_570_8).abs() < 1e-9);
        // Dimension mismatch is rejected.
        let bad_c = array![1.0_f64, 0.0];
        assert!(
            scalar_skovgaard_from_matrices(
                bad_c.view(),
                beta.view(),
                h.view(),
                None,
                row_scores.view(),
                lr,
                0.0,
            )
            .is_none()
        );
    }

    /// NON-CANONICAL FIXTURE (logistic location model, scalar): the regression
    /// guard for this module. A logistic location model `yᵢ = θ + εᵢ`,
    /// `εᵢ ~ Logistic(0, 1)`, is **non-canonical** — the observed information
    /// `ĵ = −Σ g''(yᵢ−θ̂) = 2Σ f(yᵢ−θ̂)` is data-dependent and differs from the
    /// expected (Fisher) information `î = n/3`. The exact Barndorff-Nielsen `u`
    /// for a location model is `U(θ₀)/√ĵ`, and `g'(x) = 1 − 2F(x)`,
    /// `g''(x) = −2 f(x)` with `F`, `f` the logistic CDF / PDF.
    ///
    /// The key assertion is that `expected_info` is **load-bearing in `u`**:
    /// forcing `î := ĵ` (the canonical substitution) changes `u`. The pre-fix
    /// formula `u = (θ̂−θ₀)·ĵ/√Î` does not read `expected_info` at all, so it
    /// produces the *same* `u` under that substitution — i.e. this test fails
    /// under the dropped-`î` bug and passes once `î` enters `u = (θ̂−θ₀)·î/√ĵ`.
    #[test]
    fn non_canonical_link_expected_info_enters_u() {
        let cdf = |x: f64| 1.0 / (1.0 + (-x).exp());
        let pdf = |x: f64| {
            let e = (-x).exp();
            e / ((1.0 + e) * (1.0 + e))
        };
        let gp = |x: f64| 1.0 - 2.0 * cdf(x); // g'(x)
        let g = |x: f64| -x - 2.0 * (1.0 + (-x).exp()).ln(); // log pdf

        // Fixed asymmetric dataset so θ̂ is off-centre and ĵ ≠ î.
        let y = [-0.4_f64, 0.1, 0.7, 1.3, 2.1, 2.8, 3.9, 5.5];
        let n = y.len() as f64;
        let score = |t: f64| y.iter().map(|&yi| -gp(yi - t)).sum::<f64>(); // U(θ)
        let obs_info = |t: f64| 2.0 * y.iter().map(|&yi| pdf(yi - t)).sum::<f64>(); // ĵ(t) = −Σg''
        // Newton for the MLE.
        let mut theta_hat = y.iter().sum::<f64>() / n;
        for _ in 0..100 {
            let step = score(theta_hat) / obs_info(theta_hat);
            theta_hat += step;
            if step.abs() < 1e-14 {
                break;
            }
        }
        let theta0 = 1.0_f64;
        let observed = obs_info(theta_hat); // ĵ
        let expected = n / 3.0; // î = n · (logistic Fisher info 1/3)
        // Empirical efficient information for the scalar case (engine reduction
        // with c = 1, a = Ĥ⁻¹c = 1/ĵ): Î = ĵ² / Σ sᵢ².
        let meat = y.iter().map(|&yi| gp(yi - theta_hat).powi(2)).sum::<f64>();
        let score_cov = observed * observed / meat;
        let lr = (2.0
            * (y.iter().map(|&yi| g(yi - theta_hat)).sum::<f64>()
                - y.iter().map(|&yi| g(yi - theta0)).sum::<f64>()))
        .max(0.0);
        assert!(
            expected > observed,
            "fixture must have î > ĵ: î={expected} ĵ={observed}"
        );

        let input = ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: lr,
            observed_info: observed,
            expected_info: expected,
            score_cov,
        };
        let res = scalar_skovgaard_r_star(&input).expect("r*");

        // u uses the EXPECTED information: u = (θ̂−θ₀)·î/√ĵ.
        let u_expected = (theta_hat - theta0) * expected / observed.sqrt();
        assert!(
            (res.u - u_expected).abs() < 1e-12,
            "u = {} expected {u_expected}",
            res.u
        );

        // The load-bearing guard: forcing î := ĵ (canonical) changes u. Under the
        // pre-fix u = (θ̂−θ₀)·ĵ/√Î this substitution would leave u unchanged.
        let canonical = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            expected_info: observed,
            ..input
        })
        .expect("r* canonical");
        assert!(
            (res.u - canonical.u).abs() > 1e-3,
            "expected_info must change u: non-canonical u={} canonical u={}",
            res.u,
            canonical.u
        );
        // Canonical substitution reduces u to the observed-Wald root (θ̂−θ₀)√ĵ.
        assert!(
            (canonical.u - (theta_hat - theta0) * observed.sqrt()).abs() < 1e-12,
            "canonical u must be (θ̂−θ₀)√ĵ, got {}",
            canonical.u
        );
        // The empirical companion is independent of î and tracks Î instead.
        let u_emp_expected = (theta_hat - theta0) * score_cov / observed.sqrt();
        assert!((res.u_empirical - u_emp_expected).abs() < 1e-12);
        assert!(res.r_star.is_finite() && res.r_star_empirical.is_finite());
    }

    #[test]
    fn rejects_degenerate_inputs() {
        let base = ScalarSkovgaardInput {
            theta_hat: 0.3,
            theta_null: 0.0,
            lr_statistic: 4.0,
            observed_info: 50.0,
            expected_info: 50.0,
            score_cov: 50.0,
        };
        // Non-positive LR.
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                lr_statistic: 0.0,
                ..base
            })
            .is_none()
        );
        // Non-positive info.
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                observed_info: 0.0,
                ..base
            })
            .is_none()
        );
        assert!(
            scalar_skovgaard_r_star(&ScalarSkovgaardInput {
                score_cov: -1.0,
                ..base
            })
            .is_none()
        );
        // θ̂ = θ₀ ⇒ r = 0, p = 1, not material.
        let eq = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat: 0.0,
            ..base
        })
        .expect("equal");
        assert_eq!(eq.r, 0.0);
        assert_eq!(eq.p_value_first_order, 1.0);
        assert!(!eq.material);
    }

    // ── INDEPENDENT ANALYTIC FIXTURE: Poisson mean via the Lugannani–Rice
    //    saddlepoint (#939, deliverable 3 hardening) ───────────────────────────
    //
    // A second, algebraically-distinct closed form for `r*`. For a one-parameter
    // exponential family the modified root `r*` and the Lugannani–Rice (1980)
    // saddlepoint approximation share the SAME directed root `r` and the SAME `u`,
    // but combine them by different formulas:
    //
    //   * Barndorff-Nielsen:  r* = r + (1/r)·log(u/r),  tail = Φ(−r*),
    //   * Lugannani–Rice:     tail = 1 − Φ(r) − φ(r)·(1/r − 1/u).
    //
    // Both are third-order-accurate approximations to the SAME exact tail
    // probability, so they must agree to O(n⁻³ᐟ²). Reproducing the L–R tail from
    // OUR `(r, u)` is therefore an independent check that the engine's `u` (built
    // from observed/expected/score information) is the genuine Skovgaard `u` — a
    // different derivation than the Exponential/canonical anchor already in the
    // module, on a different family.
    //
    // Poisson model: `S ~ Poisson(nμ)`, canonical θ = log μ. For the natural
    // sufficient statistic the canonical-family `u` equals the Wald root
    // `q = (θ̂−θ₀)·√ĵ` with `ĵ = nμ̂ = S` (the exact observed information in θ),
    // and the LR root is `r = sign(θ̂−θ₀)·√W`, `W = 2[S log(S/(nμ₀)) − (S−nμ₀)]`.

    /// Standard normal pdf.
    fn normal_pdf(z: f64) -> f64 {
        (-0.5 * z * z).exp() / (2.0 * std::f64::consts::PI).sqrt()
    }

    /// The right-tail `P(X ≥ x)` for the Poisson saddlepoint problem, computed two
    /// independent ways from a single `(r, u)`: our Barndorff-Nielsen `r*` tail and
    /// the Lugannani–Rice tail. Returns `(p_rstar, p_lr, p_first_order)`.
    fn poisson_tails(n: f64, mu_hat: f64, mu0: f64) -> (f64, f64, f64) {
        let theta_hat = mu_hat.ln();
        let theta0 = mu0.ln();
        let s = n * mu_hat; // sufficient statistic S = nμ̂
        // LR statistic W = 2[S log(S/(nμ₀)) − (S − nμ₀)].
        let w = 2.0 * (s * (s / (n * mu0)).ln() - (s - n * mu0));
        // AT-THE-NULL atom (`μ̂ = μ₀` ⇒ `θ̂ = θ₀`, `W = 0`): the directed root is
        // exactly `r = 0`, `r*` is undefined, and the right-tail probability is
        // exactly `½` for all three forms. `scalar_skovgaard_r_star` correctly
        // returns `None` on a zero LR (the degenerate-input contract), so handle
        // this lattice atom here rather than unwrapping a `None`. For n=10, μ₀=1.3
        // the integer `s = 13` lands exactly on the null, so this branch is live.
        if theta_hat == theta0 || !(w > 0.0) {
            return (0.5, 0.5, 0.5);
        }
        // Observed/expected/score info in θ all equal nμ̂ = S for the canonical
        // Poisson at the MLE — the canonical identity î = ĵ = Î.
        let info = s;
        let res = scalar_skovgaard_r_star(&ScalarSkovgaardInput {
            theta_hat,
            theta_null: theta0,
            lr_statistic: w,
            observed_info: info,
            expected_info: info,
            score_cov: info,
        })
        .expect("poisson r*");
        let r = res.r;
        let u = res.u; // canonical ⇒ u = (θ̂−θ₀)√ĵ, the Wald root
        // Our r* right-tail P(X ≥ x) = Φ(−r*) = 1 − Φ(r*).
        let p_rstar = 1.0 - normal_cdf(res.r_star);
        // Lugannani–Rice tail from the same (r, u).
        let p_lr = (1.0 - normal_cdf(r)) - normal_pdf(r) * (1.0 / r - 1.0 / u);
        let p_first = 1.0 - normal_cdf(r);
        (p_rstar, p_lr, p_first)
    }

    #[test]
    fn poisson_r_star_tail_matches_lugannani_rice_saddlepoint() {
        // A genuine upper-tail event: μ̂ above μ₀ so r, u > 0 and the tail is small.
        // Several (n, μ̂, μ₀) so the agreement is not a single coincidence.
        for &(n, mu_hat, mu0) in &[
            (12.0_f64, 1.6_f64, 1.0_f64),
            (20.0, 2.3, 1.7),
            (8.0, 3.1, 2.0),
            (30.0, 0.9, 0.6),
        ] {
            let (p_rstar, p_lr, p_first) = poisson_tails(n, mu_hat, mu0);
            // Both saddlepoint tails are valid probabilities.
            assert!(
                (0.0..=1.0).contains(&p_rstar) && (0.0..=1.0).contains(&p_lr),
                "n={n} μ̂={mu_hat}: tails must be probabilities (r*={p_rstar}, LR={p_lr})"
            );
            // INDEPENDENT AGREEMENT: r* and Lugannani–Rice must coincide to the
            // shared O(n⁻³ᐟ²) order. Their relative gap shrinks with n; at these
            // modest n a 5% relative band (and a tight absolute floor) holds.
            let rel = (p_rstar - p_lr).abs() / p_lr.max(1e-12);
            assert!(
                (p_rstar - p_lr).abs() < 5e-3 || rel < 0.05,
                "n={n} μ̂={mu_hat} μ₀={mu0}: r* tail {p_rstar:.6} must match \
                 Lugannani–Rice {p_lr:.6} (|Δ|={:.2e}, rel={rel:.3})",
                (p_rstar - p_lr).abs()
            );
            // And both higher-order tails must DIFFER from the raw first-order
            // directed-root tail — otherwise the correction is a no-op and the
            // agreement above would be vacuous.
            assert!(
                (p_rstar - p_first).abs() > 1e-4,
                "n={n} μ̂={mu_hat}: r* must move the tail off the first-order value \
                 (r*={p_rstar:.6}, first-order={p_first:.6})"
            );
        }
    }

    /// SMALL-n SIZE CHECK (#939, deliverable 3 hardening): under the null the
    /// one-sided p-value from the modified root `r*` must be BETTER calibrated
    /// (closer to Uniform / nominal size) than the raw first-order directed root
    /// `r`. Exact null distribution: `S ~ Poisson(nμ₀)` summed over the integer
    /// support — no Monte-Carlo noise, the size is computed exactly from the pmf.
    #[test]
    fn poisson_r_star_improves_small_n_size_over_first_order() {
        let mu0 = 1.3_f64;
        // Two complementary calibration metrics, accumulated across all n:
        //   (1) the DISCRETE exact rejection size at fixed α — coarse, because a
        //       Poisson statistic rejects at whole atoms, so r* and the
        //       first-order root can tie when their p-values straddle the same
        //       atom (a no-op at that α/n, never an improvement). We require r*
        //       to be NO WORSE at every (n, α) and strictly better in aggregate.
        //   (2) accuracy against the EXACT Poisson upper-tail probability
        //       P(S′ ≥ s) (ground truth, summed from the same pmf): the
        //       third-order r* tail must be a strictly better approximation to
        //       the exact tail than the first-order root, in pmf-weighted mean
        //       absolute error over the upper half. This is not quantized by the
        //       rejection grid, so it is the un-aliased witness that r* genuinely
        //       sharpens the tail.
        let alphas = [0.05_f64, 0.10];
        let mut total_err_first = 0.0_f64;
        let mut total_err_star = 0.0_f64;
        let mut total_mae_first = 0.0_f64;
        let mut total_mae_star = 0.0_f64;
        // Small n where the first-order directed root is visibly skewed.
        for &n in &[10.0_f64, 16.0, 25.0] {
            let rate = n * mu0; // S ~ Poisson(rate)
            let s_max = (rate + 50.0 * rate.sqrt()).ceil() as usize;
            // Materialize the exact pmf so we can form the exact upper tail.
            let mut pmf_vec = vec![0.0_f64; s_max + 1];
            let mut pmf = (-rate).exp();
            pmf_vec[0] = pmf;
            for s in 1..=s_max {
                pmf *= rate / s as f64;
                pmf_vec[s] = pmf;
            }
            // Exact upper tail P(S′ ≥ s) = Σ_{t≥s} pmf(t).
            let mut exact_upper = vec![0.0_f64; s_max + 2];
            for s in (0..=s_max).rev() {
                exact_upper[s] = exact_upper[s + 1] + pmf_vec[s];
            }
            let mut size_first = [0.0_f64; 2];
            let mut size_star = [0.0_f64; 2];
            // pmf-weighted mean |approx tail − exact tail| over the upper half.
            let mut tail_err_first = 0.0_f64;
            let mut tail_err_star = 0.0_f64;
            let mut mass_upper = 0.0_f64;
            for s in 1..=s_max {
                let p = pmf_vec[s];
                let mu_hat = s as f64 / n;
                // Upper-tail p-values (one-sided test μ > μ₀). For μ̂ < μ₀ the
                // upper-tail p-value is > 0.5 and never triggers a small-α
                // rejection, so this cleanly isolates the calibrated tail.
                let (p_rstar, _p_lr, p_first) = poisson_tails(n, mu_hat, mu0);
                for (j, &a) in alphas.iter().enumerate() {
                    if p_first <= a {
                        size_first[j] += p;
                    }
                    if p_rstar <= a {
                        size_star[j] += p;
                    }
                }
                if mu_hat >= mu0 {
                    // CONTINUITY-CORRECTED ground truth. The saddlepoint tails
                    // `p_first` / `p_rstar` are CONTINUOUS approximations built
                    // from the integer-valued statistic `S = s`, so they target
                    // the lattice tail at the MID-CELL point `s − ½`, i.e. the
                    // continuity-corrected exact tail `½[P(S′ ≥ s) + P(S′ ≥ s+1)]`
                    // — NOT the raw integer atom `P(S′ ≥ s)`. Comparing the
                    // continuous tail against the un-corrected integer tail
                    // introduces a fixed half-integer offset that the cruder
                    // first-order root happens to partially absorb, ALIASING the
                    // MAE so the more-accurate third-order `r*` looks worse. With
                    // the standard mid-cell continuity correction the comparison
                    // is on the lattice point the saddlepoint actually estimates,
                    // and `r*`'s genuine O(n⁻³ᐟ²) sharpening shows through (it is
                    // ~5× closer to the exact tail than the first-order root here).
                    let exact = 0.5 * (exact_upper[s] + exact_upper[s + 1]);
                    tail_err_first += p * (p_first - exact).abs();
                    tail_err_star += p * (p_rstar - exact).abs();
                    mass_upper += p;
                }
            }
            // (1) No-worse-everywhere at fixed α, accumulating the aggregate error.
            for (j, &a) in alphas.iter().enumerate() {
                let err_first = (size_first[j] - a).abs();
                let err_star = (size_star[j] - a).abs();
                assert!(
                    err_star <= err_first + 1e-9,
                    "n={n} α={a}: r* size {:.4} (|Δ|={err_star:.4}) must be no worse than \
                     first-order size {:.4} (|Δ|={err_first:.4})",
                    size_star[j],
                    size_first[j]
                );
                total_err_first += err_first;
                total_err_star += err_star;
            }
            // (2) The un-aliased witness: the r* tail must approximate the EXACT
            // upper-tail probability NO WORSE than the first-order root at every
            // n (a half-integer continuity offset can tie a particular n), and
            // strictly better in aggregate below. pmf-weighted MAE over the upper
            // half.
            let mae_first = tail_err_first / mass_upper;
            let mae_star = tail_err_star / mass_upper;
            assert!(
                mae_star <= mae_first + 1e-12,
                "n={n}: r* tail must approximate the exact Poisson upper tail no worse \
                 than first-order: MAE*={mae_star:.6} must be ≤ MAE={mae_first:.6}"
            );
            total_mae_first += mae_first;
            total_mae_star += mae_star;
        }
        // Aggregate strict improvement, robust to per-point discreteness ties:
        //   (a) the exact-tail MAE summed over all n must strictly drop — r*
        //       genuinely sharpens the tail (the un-aliased, continuous witness);
        //   (b) the discrete rejection-size error summed over all (n, α) must be
        //       no worse — the correction never degrades nominal calibration.
        assert!(
            total_mae_star < total_mae_first - 1e-9,
            "r* must strictly improve the aggregate exact-tail MAE over first-order: \
             Σ MAE*={total_mae_star:.6} must be < Σ MAE={total_mae_first:.6}"
        );
        assert!(
            total_err_star <= total_err_first + 1e-9,
            "r* must not worsen the aggregate discrete size over first-order: \
             Σ|size_r*−α|={total_err_star:.5} must be ≤ Σ|size_r−α|={total_err_first:.5}"
        );
    }
}