murr 0.2.1

Columnar in-memory cache for AI/ML inference workloads
Documentation
use arrow::{
    array::{Array, ArrayRef},
    datatypes::{DataType, UInt64Type},
};
use serde_json::Value;

use crate::{
    core::{DType, DTypeName, MurrError},
    io::{
        codec::{ArrowCodec, ColumnDecoder, ColumnEncoder, JsonCodec, primitive},
        schema::SegmentColumnSchema,
    },
};

pub struct UInt64;

impl DType for UInt64 {
    fn name(&self) -> DTypeName {
        DTypeName::UInt64
    }
    fn arrow_dtype(&self) -> DataType {
        DataType::UInt64
    }
    fn size(&self) -> usize {
        8
    }
}

impl ArrowCodec for UInt64 {
    fn make_encoder(&self, col: SegmentColumnSchema, rows: usize) -> Box<dyn ColumnEncoder> {
        Box::new(primitive::Encoder::<UInt64Type>::new(col, rows))
    }
    fn make_decoder(
        &self,
        col: SegmentColumnSchema,
        arr: &dyn Array,
    ) -> Result<Box<dyn ColumnDecoder>, MurrError> {
        Ok(Box::new(primitive::Decoder::<UInt64Type>::new(col, arr)?))
    }
}

impl JsonCodec for UInt64 {
    fn to_json(&self, arr: &dyn Array) -> Result<Vec<Value>, MurrError> {
        primitive::to_json::<UInt64Type>(arr)
    }
    fn from_json(&self, vals: &[Value]) -> Result<ArrayRef, MurrError> {
        primitive::from_json::<UInt64Type>(vals)
    }
}

#[cfg(test)]
mod tests {
    use super::*;
    use crate::io::codec::test_util::{assert_json_roundtrip, assert_row_roundtrip};
    use arrow::array::UInt64Array;
    use rstest::rstest;

    #[rstest]
    #[case::null(None)]
    #[case::zero(Some(0))]
    #[case::max(Some(u64::MAX))]
    #[case::mid(Some(7))]
    #[case::above_2_53(Some((1u64 << 53) + 1))]
    fn row_roundtrip(#[case] v: Option<u64>) {
        assert_row_roundtrip(DTypeName::UInt64, &UInt64Array::from(vec![v]));
    }

    #[rstest]
    #[case::null(None)]
    #[case::zero(Some(0))]
    #[case::max(Some(u64::MAX))]
    #[case::mid(Some(7))]
    #[case::above_2_53(Some((1u64 << 53) + 1))]
    fn json_roundtrip(#[case] v: Option<u64>) {
        assert_json_roundtrip(DTypeName::UInt64, &UInt64Array::from(vec![v]));
    }

    #[test]
    fn json_preserves_precision_above_2_53() {
        // 2^53 + 1 cannot survive an f64 detour; serde_json's Number::as_u64 keeps it exact.
        let big: u64 = (1u64 << 53) + 1;
        let arr = UInt64Array::from(vec![Some(big)]);
        let json = UInt64.to_json(&arr).unwrap();
        assert_eq!(json[0], Value::from(big));
    }
}