use std::sync::Arc;
use vyre_foundation::ir::model::expr::Ident;
use vyre_foundation::ir::{BufferAccess, BufferDecl, DataType, Expr, Node, Program};
pub const OP_ID: &str = "vyre-primitives::math::gaussian_rdp_step";
#[must_use]
pub fn gaussian_rdp_step(alpha: &str, sigma_squared: &str, out: &str, count: u32) -> Program {
if count == 0 {
return crate::invalid_output_program(
OP_ID,
out,
DataType::U32,
format!("Fix: gaussian_rdp_step requires count > 0, got {count}."),
);
}
let t = Expr::InvocationId { axis: 0 };
let denom = Expr::mul(Expr::u32(2), Expr::load(sigma_squared, t.clone()));
let value = Expr::div(Expr::load(alpha, t.clone()), denom);
let body = vec![Node::if_then(
Expr::lt(t.clone(), Expr::u32(count)),
vec![Node::store(out, t, value)],
)];
Program::wrapped(
vec![
BufferDecl::storage(alpha, 0, BufferAccess::ReadOnly, DataType::U32).with_count(count),
BufferDecl::storage(sigma_squared, 1, BufferAccess::ReadOnly, DataType::U32)
.with_count(count),
BufferDecl::storage(out, 2, BufferAccess::ReadWrite, DataType::U32).with_count(count),
],
[256, 1, 1],
vec![Node::Region {
generator: Ident::from(OP_ID),
source_region: None,
body: Arc::new(body),
}],
)
}
#[must_use]
pub fn gaussian_rdp_step_cpu(alpha: &[f64], sigma_squared: &[f64]) -> Vec<f64> {
alpha
.iter()
.zip(sigma_squared.iter())
.map(|(&a, &s2)| a / (2.0 * s2))
.collect()
}
#[must_use]
pub fn rdp_to_dp(rdp: f64, alpha: f64, delta: f64) -> f64 {
if alpha <= 1.0 || !(delta > 0.0 && delta < 1.0) {
return f64::INFINITY;
}
rdp + (1.0 / delta).ln() / (alpha - 1.0)
}
#[cfg(test)]
mod tests {
use super::*;
const EPS: f64 = 1e-10;
fn approx_eq(a: f64, b: f64) -> bool {
(a - b).abs() < EPS * (1.0 + a.abs() + b.abs())
}
#[test]
fn cpu_alpha_2_sigma_1() {
let r = gaussian_rdp_step_cpu(&[2.0], &[1.0]);
assert!(approx_eq(r[0], 1.0));
}
#[test]
fn cpu_doubling_alpha_doubles_rdp() {
let r1 = gaussian_rdp_step_cpu(&[3.0], &[2.0]);
let r2 = gaussian_rdp_step_cpu(&[6.0], &[2.0]);
assert!(approx_eq(r2[0], 2.0 * r1[0]));
}
#[test]
fn cpu_doubling_sigma_squared_halves_rdp() {
let r1 = gaussian_rdp_step_cpu(&[4.0], &[1.0]);
let r2 = gaussian_rdp_step_cpu(&[4.0], &[2.0]);
assert!(approx_eq(r2[0], r1[0] / 2.0));
}
#[test]
fn cpu_batch_independent_lanes() {
let alpha = vec![2.0, 4.0, 8.0];
let s2 = vec![1.0, 2.0, 4.0];
let r = gaussian_rdp_step_cpu(&alpha, &s2);
assert!(approx_eq(r[0], 1.0)); assert!(approx_eq(r[1], 1.0)); assert!(approx_eq(r[2], 1.0)); }
#[test]
fn cpu_mismatched_inputs_truncate_to_complete_pairs() {
let r = gaussian_rdp_step_cpu(&[2.0, 4.0], &[1.0]);
assert_eq!(r.len(), 1);
assert!(approx_eq(r[0], 1.0));
}
#[test]
fn rdp_to_dp_monotone_in_rdp() {
let alpha = 4.0;
let delta = 1e-5;
let e1 = rdp_to_dp(0.5, alpha, delta);
let e2 = rdp_to_dp(1.0, alpha, delta);
assert!(e2 > e1);
}
#[test]
fn rdp_to_dp_known_value() {
let eps = rdp_to_dp(0.0, 2.0, std::f64::consts::E.recip());
assert!(approx_eq(eps, 1.0));
}
#[test]
fn rdp_to_dp_alpha_one_is_conservative_infinity() {
assert!(rdp_to_dp(0.5, 1.0, 0.5).is_infinite());
}
#[test]
fn rdp_to_dp_delta_zero_is_conservative_infinity() {
assert!(rdp_to_dp(0.5, 2.0, 0.0).is_infinite());
}
#[test]
fn ir_program_buffer_layout() {
let p = gaussian_rdp_step("alpha", "s2", "out", 64);
assert_eq!(p.workgroup_size, [256, 1, 1]);
let names: Vec<&str> = p.buffers.iter().map(|b| b.name()).collect();
assert_eq!(names, vec!["alpha", "s2", "out"]);
for buf in p.buffers.iter() {
assert_eq!(buf.count(), 64);
}
}
#[test]
fn zero_count_traps() {
let p = gaussian_rdp_step("a", "s", "o", 0);
assert!(p.stats().trap());
}
}