opendp 0.14.2-dev.20260401.2

A library of differential privacy algorithms for the statistical analysis of sensitive private data.
use crate::domains::{LazyFrameDomain, SeriesDomain, SeriesElementDomain};
use crate::metrics::{FrameDistance, SymmetricDistance};
use crate::transformations::make_stable_lazyframe;

use super::*;

fn assert_expr_to_physical<DI: 'static + SeriesElementDomain, DO: 'static + SeriesElementDomain>(
    in_elem_domain: DI,
    in_series: Series,
    out_elem_domain: DO,
    out_series: Series,
) -> Fallible<()> {
    let name = in_series.name().clone();
    let in_series_domain = SeriesDomain::new(name.clone(), in_elem_domain);
    let lf_domain = LazyFrameDomain::new(vec![in_series_domain.clone()])?;
    let lf = DataFrame::new(vec![in_series.into_column()])?.lazy();

    let t_binned = make_stable_lazyframe(
        lf_domain,
        FrameDistance(SymmetricDistance),
        lf.clone().with_column(col(name.clone()).to_physical()),
    )?;

    // check that data is transformed as expected
    let expected = DataFrame::new(vec![out_series.into_column()])?;
    let actual = t_binned.invoke(&lf)?.collect()?;
    assert_eq!(expected, actual);

    // check that domain is transformed as expected
    let out_series_domain = SeriesDomain::new(name, out_elem_domain);
    let expected_lf_domain = LazyFrameDomain::new(vec![out_series_domain])?;

    assert_eq!(t_binned.output_domain, expected_lf_domain);

    Ok(())
}

#[test]
fn test_expr_to_physical_categorical() -> Fallible<()> {
    let in_elem_domain = CategoricalDomain::new_with_categories(
        vec!["A", "B", "C", "D"]
            .into_iter()
            .map(PlSmallStr::from)
            .collect(),
    )?;

    let in_series = Series::new("data".into(), ["A", "B", "B", "C", "D"]).cast(
        &DataType::Categorical(Categories::global(), Categories::global().mapping()),
    )?;

    let out_elem_domain = AtomDomain::<u32>::default();
    let out_series = Series::new("data".into(), [0u32, 1, 1, 2, 3]);
    assert_expr_to_physical(in_elem_domain, in_series, out_elem_domain, out_series)
}

#[test]
fn test_expr_to_physical_same() -> Fallible<()> {
    fn assert<D: 'static + SeriesElementDomain>(elem_domain: D, series: Series) -> Fallible<()> {
        assert_expr_to_physical(elem_domain.clone(), series.clone(), elem_domain, series)
    }
    assert(
        AtomDomain::<i32>::default(),
        Series::new("x".into(), [1i32, 4, 7, 3]),
    )?;
    assert(
        AtomDomain::<String>::default(),
        Series::new(
            "x".into(),
            ["C".to_string(), "A".to_string(), "B".to_string()],
        ),
    )?;
    assert(
        AtomDomain::<bool>::default(),
        Series::new("x".into(), [true, false, false]),
    )?;
    assert(
        AtomDomain::<f32>::default(),
        Series::new("x".into(), [1.0f32, 2.0, 7.0]),
    )?;
    Ok(())
}