buffa 0.8.0 - Docs.rs

//! External size cache for linear-time serialization.
//!
//! Protobuf's wire format requires knowing the encoded size of a sub-message
//! before writing it (for the length-delimited prefix). Without caching, each
//! nesting level recomputes all sizes below it — O(depth²) for chains,
//! exponential for branchy trees. prost has this problem.
//!
//! `SizeCache` records sub-message sizes in a `Vec<u32>` indexed by
//! pre-order DFS traversal, populated by `compute_size` and consumed in the
//! same order by `write_to`. Both passes are O(n).
//!
//! The cache is external to message structs — generated types hold no
//! serialization state, so `let Msg { a, b, .. } = m;` is not forced by
//! hidden plumbing fields. A fresh `SizeCache` is constructed inside the
//! provided `Message::encode*` / `ViewEncode::encode*` methods; manual
//! implementers thread it through their `compute_size` / `write_to`.
//!
//! # Traversal-order invariant
//!
//! `reserve`/`set` calls during `compute_size` must occur in the same
//! order as `consume_next` calls during `write_to`. Generated code guarantees
//! this by iterating fields identically in both functions and by guarding
//! both with identical presence checks (both take `&self`, so the message
//! is immutable between passes). Manual `Message` implementations must
//! uphold the same ordering.

use alloc::vec::Vec;
use core::mem::MaybeUninit;

/// Number of nested-message sizes stored inline (no heap allocation).
///
/// `Message::encode*` constructs a fresh `SizeCache` per call, so messages
/// with ≤ `INLINE_CAP` length-delimited sub-messages encode with zero
/// allocation for the cache. 16 covers the vast majority of message shapes
/// (the official protobuf benchmark messages all fit) at 64 bytes of stack.
const INLINE_CAP: usize = 16;

/// Transient pre-order cache of nested-message sizes for the two-pass
/// serialization model (`compute_size` populates, `write_to` consumes).
///
/// `Message::encode` and friends construct and discard a `SizeCache`
/// internally — most callers never name this type. It appears in the
/// `compute_size` / `write_to` signatures so that manual `Message`
/// implementations can thread it through nested-message recursion.
///
/// Storage is a small inline `[u32; 16]` array with a `Vec<u32>` spill for
/// the (uncommon) case of more than 16 nested length-delimited sub-messages,
/// so a fresh cache is allocation-free for typical messages.
///
/// Reusable across encodes: call [`clear`](Self::clear) between uses to
/// retain the spill allocation. `SizeCache` is intentionally not `Clone`
/// — it is transient encode state, not data. Reuse via
/// [`clear()`](Self::clear).
///
/// # Safety invariant
///
/// The inline slots are `MaybeUninit` to avoid zeroing the whole array on every
/// construction (see the field comment). The invariant that keeps the single
/// `unsafe` read in [`consume_next`](Self::consume_next) sound is:
///
/// > every inline slot at an index `< len` has been initialized.
///
/// It is established in exactly one place — [`reserve`](Self::reserve) writes
/// the slot at index `len` *before* incrementing `len` — and `len` only ever
/// grows via `reserve` (which does that write) or resets to `0` via
/// [`clear`](Self::clear). `consume_next` only reads a slot after checking
/// `idx < len`. Because all three methods and the fields are private to this
/// module, no external code (generated or hand-written) can break the
/// invariant: the worst a misuse can do is trip the `idx >= len` overrun panic
/// or read a wrong-but-initialized size — never undefined behavior.
pub struct SizeCache {
    // `MaybeUninit` avoids zeroing the whole array on construction. A fresh
    // cache is built per encode and handed by `&mut` to an out-of-line
    // `compute_size`, so the compiler cannot prove the unused tail is never
    // read and an `[0; INLINE_CAP]` initializer emits `INLINE_CAP / 4` SSE
    // stores on *every* encode (confirmed by disassembly). With `MaybeUninit`
    // only the slots actually used are written. See the type's safety invariant.
    inline: [MaybeUninit<u32>; INLINE_CAP],
    spill: Vec<u32>,
    len: u32,
    cursor: u32,
}

impl core::fmt::Debug for SizeCache {
    fn fmt(&self, f: &mut core::fmt::Formatter<'_>) -> core::fmt::Result {
        // Only the first `len` inline slots are initialized; show those (plus the
        // spill) so the dump is meaningful without reading uninitialized memory.
        let inline_init = (self.len as usize).min(INLINE_CAP);
        // SAFETY: per the type invariant, every inline slot at an index < len is
        // initialized, so this prefix is sound to view as `&[u32]`.
        let inline =
            unsafe { core::slice::from_raw_parts(self.inline.as_ptr().cast::<u32>(), inline_init) };
        f.debug_struct("SizeCache")
            .field("len", &self.len)
            .field("cursor", &self.cursor)
            .field("inline", &inline)
            .field("spill", &self.spill)
            .finish()
    }
}

impl Default for SizeCache {
    #[inline]
    fn default() -> Self {
        Self::new()
    }
}

impl SizeCache {
    /// Create an empty cache. No heap allocation.
    #[inline]
    #[must_use]
    pub const fn new() -> Self {
        Self {
            inline: [MaybeUninit::uninit(); INLINE_CAP],
            spill: Vec::new(),
            len: 0,
            cursor: 0,
        }
    }

    /// Clear the cache for reuse. Retains the spill allocation's capacity.
    #[inline]
    pub fn clear(&mut self) {
        self.spill.clear();
        self.len = 0;
        self.cursor = 0;
    }

    /// Construct a cache that reuses a caller-supplied spill buffer.
    ///
    /// The inline storage is always stack-allocated; only the spill `Vec` ever
    /// heap-allocates, and only for messages with more than 16 nested
    /// length-delimited sub-messages. Handing in a previously-grown buffer makes
    /// such an encode allocation-free for the cache. The buffer is cleared (its
    /// capacity retained). Most callers should reach for a [`SizeCachePool`]
    /// rather than thread buffers by hand.
    #[inline]
    #[must_use]
    pub fn with_spill_buffer(mut spill: Vec<u32>) -> Self {
        spill.clear();
        Self {
            inline: [MaybeUninit::uninit(); INLINE_CAP],
            spill,
            len: 0,
            cursor: 0,
        }
    }

    /// Reclaim the spill buffer for reuse, consuming the cache.
    ///
    /// The returned `Vec` retains whatever capacity the cache grew to; feed it
    /// back into [`with_spill_buffer`](Self::with_spill_buffer) — or let a
    /// [`SizeCachePool`] manage it — so the next encode reuses the allocation.
    #[inline]
    #[must_use]
    pub fn into_spill_buffer(self) -> Vec<u32> {
        self.spill
    }

    /// Reserve a slot for a nested message's size. Call immediately before
    /// recursing into `child.compute_size(cache)`, then fill the slot with
    /// [`set`](Self::set) after the recursion returns. This reserves the slot
    /// in pre-order even though the size is known in post-order.
    ///
    /// Used by generated `compute_size` implementations.
    #[inline]
    pub fn reserve(&mut self) -> usize {
        debug_assert!(self.len < u32::MAX, "SizeCache slot count overflow");
        let idx = self.len as usize;
        if idx < INLINE_CAP {
            // Placeholder so a buggy caller that reserves-without-set reads a
            // deterministic 0, including after `clear()` reuse. This write is
            // ALSO load-bearing for soundness: it establishes the type
            // invariant (slots `< len` are initialized) that makes the
            // `assume_init` in `consume_next` sound. Do not remove it.
            self.inline[idx] = MaybeUninit::new(0);
        } else {
            self.spill.push(0);
        }
        self.len += 1;
        idx
    }

    /// Fill a previously-reserved slot.
    ///
    /// Used by generated `compute_size` implementations.
    ///
    /// # Panics
    ///
    /// Panics if `idx` was not returned by a prior [`reserve`](Self::reserve)
    /// on this cache (i.e. `idx >= len`).
    #[inline]
    #[track_caller]
    pub fn set(&mut self, idx: usize, size: u32) {
        assert!(
            idx < self.len as usize,
            "SizeCache::set: slot {idx} not reserved (len {})",
            self.len
        );
        if idx < INLINE_CAP {
            self.inline[idx] = MaybeUninit::new(size);
        } else {
            self.spill[idx - INLINE_CAP] = size;
        }
    }

    /// Consume the next cached size in pre-order.
    ///
    /// Used by generated `write_to` implementations for length-delimited
    /// nested message headers.
    ///
    /// # Panics
    ///
    /// Panics if the cursor runs past the end of the cache — i.e. if
    /// `write_to` traversal diverges from `compute_size` traversal. For
    /// generated code this indicates a codegen bug; for manual `Message`
    /// implementations it indicates a traversal-order mismatch.
    #[inline]
    #[track_caller]
    pub fn consume_next(&mut self) -> u32 {
        let idx = self.cursor as usize;
        if idx >= self.len as usize {
            Self::overrun(idx, self.len);
        }
        self.cursor += 1;
        if idx < INLINE_CAP {
            // SAFETY: `idx < self.len` (checked above) and, per the type
            // invariant, every inline slot at an index `< len` was initialized
            // by `reserve` before `len` advanced past it (and possibly
            // overwritten by `set`), so this slot is initialized.
            unsafe { self.inline[idx].assume_init() }
        } else {
            self.spill[idx - INLINE_CAP]
        }
    }

    #[cold]
    #[inline(never)]
    #[track_caller]
    fn overrun(idx: usize, len: u32) -> ! {
        panic!(
            "SizeCache cursor overrun: write_to consumed {} slots but \
             compute_size produced {len} (traversal-order mismatch)",
            idx + 1,
        )
    }
}

/// A caller-owned free-list of spill buffers that amortizes the [`SizeCache`]
/// spill allocation across many encodes.
///
/// # When you need it
///
/// Every `encode` / `encoded_len` builds a fresh [`SizeCache`]. The inline
/// storage is free (stack, no zeroing), so for messages with at most 16 nested
/// length-delimited sub-messages there is nothing to pool. Messages that exceed
/// that — deeply nested, repeated-sub-message shapes — spill to a heap `Vec` on
/// *every* encode. Routing those through a pool reuses one allocation instead.
///
/// ## vs. reusing a single [`SizeCache`]
///
/// For plain sequential reuse you don't strictly need a pool: hold one
/// [`SizeCache`] and call [`encode_with_cache`](crate::Message::encode_with_cache)
/// with [`clear`](SizeCache::clear) between encodes. The pool adds two things
/// that bare reuse cannot: it **shrinks an oversized buffer back on return**
/// (`max_capacity`), so one giant message does not pin peak memory for the
/// lifetime of the cache, and it supports **multiple caches checked out at once**
/// (`max_buffers`), so re-entrant or nested encodes each get their own buffer.
/// If neither matters, a single reused `SizeCache` is simpler.
///
/// # Bring your own — buffa holds no global state
///
/// You own the pool and decide its scope and lifetime: keep one in a
/// `thread_local!` for implicit per-thread reuse, or in a request/connection
/// context for reuse that is freed at that boundary. Only the spill `Vec` is
/// pooled; each cache's inline storage stays on the stack, so routing a *small*
/// message through the pool is just a `Vec` pop/push of an empty buffer — no
/// allocation, no thread-local access, no synchronization. The pool is
/// `alloc`-only, so it works in `no_std` builds.
///
/// # Bounds
///
/// Two limits keep memory in check, both set at construction:
///
/// - `max_buffers` — how many spill buffers the free-list retains. `1` suffices
///   for sequential reuse (one cache in flight at a time, e.g. a `thread_local!`
///   pool — see [`sequential`](Self::sequential)); raise it only for re-entrant
///   or nested encodes that hold several caches at once.
/// - `max_capacity` — the cap, in **`u32` slots**, on each retained buffer's
///   capacity. One slot holds one nested sub-message's size; the first 16 are
///   inline-free, so `max_capacity = N` retains up to `N * 4` bytes per buffer
///   and keeps the allocation warm for messages with up to `N + 16` nested
///   sub-messages. Set it at or above your steady-state spill size — below it,
///   every encode regrows the buffer and `release` shrinks it back, which is worse
///   than not pooling. A few hundred is a sensible starting point.
///
/// Passing `0` for either bound disables retention (the pool then always
/// allocates a fresh cache per `acquire`).
///
/// # Example: a thread-local pool
///
/// ```
/// use core::cell::RefCell;
/// use buffa::{Message, SizeCachePool};
///
/// thread_local! {
///     // `const fn new` allows const-initialized thread-locals.
///     static POOL: RefCell<SizeCachePool> = const { RefCell::new(SizeCachePool::sequential(512)) };
/// }
///
/// fn encode_pooled<M: Message>(msg: &M) -> Vec<u8> {
///     let mut buf = Vec::new();
///     POOL.with_borrow_mut(|pool| pool.encode(msg, &mut buf));
///     buf
/// }
/// ```
#[derive(Debug)]
pub struct SizeCachePool {
    free: Vec<Vec<u32>>,
    max_buffers: usize,
    max_capacity: usize,
}

impl SizeCachePool {
    /// Create an empty pool. No heap allocation until the first encode spills.
    ///
    /// `max_buffers` bounds the retained free-list length; `max_capacity` bounds
    /// each retained buffer's element capacity so a single large message cannot
    /// pin its peak allocation. For sequential (non-re-entrant) reuse —
    /// e.g. a `thread_local!` encode buffer — `max_buffers = 1` is enough.
    #[inline]
    #[must_use]
    pub const fn new(max_buffers: usize, max_capacity: usize) -> Self {
        Self {
            free: Vec::new(),
            max_buffers,
            max_capacity,
        }
    }

    /// Create a pool for sequential reuse — one cache checked out at a time.
    ///
    /// Equivalent to [`new(1, max_capacity)`](Self::new); the right choice for a
    /// `thread_local!` or per-request pool where encodes do not nest. Takes only
    /// the `max_capacity` slot cap (see the [type docs](Self#bounds)), avoiding
    /// the two-`usize` ordering ambiguity of [`new`](Self::new) for the common
    /// case.
    #[inline]
    #[must_use]
    pub const fn sequential(max_capacity: usize) -> Self {
        Self::new(1, max_capacity)
    }

    /// Check out a cache, reusing a pooled spill buffer if one is available.
    ///
    /// Pair with [`release`](Self::release) to return it. The convenience methods
    /// ([`encode`](Self::encode), [`encode_view`](Self::encode_view),
    /// [`encoded_len`](Self::encoded_len)) do the acquire/return for you; use
    /// `acquire`/`release` directly only for manual `compute_size` / `write_to`.
    #[inline]
    #[must_use]
    pub fn acquire(&mut self) -> SizeCache {
        match self.free.pop() {
            Some(buf) => SizeCache::with_spill_buffer(buf),
            None => SizeCache::new(),
        }
    }

    /// Return a cache's spill buffer to the pool, honoring both bounds.
    ///
    /// A cache that never spilled, or whose buffer shrank to nothing under a
    /// `max_capacity` of `0`, is dropped rather than retained — the free-list
    /// never holds a zero-capacity buffer that would yield no reuse.
    #[inline]
    pub fn release(&mut self, cache: SizeCache) {
        if self.free.len() >= self.max_buffers {
            return;
        }
        let mut buf = cache.into_spill_buffer();
        // Clear first so `shrink_to` is not floored by the live length.
        buf.clear();
        if buf.capacity() > self.max_capacity {
            buf.shrink_to(self.max_capacity);
        }
        // After the shrink: skip never-spilled (cap 0) and shrunk-to-0 buffers —
        // a zero-capacity slot in the free-list yields no reuse on `acquire`.
        if buf.capacity() == 0 {
            return;
        }
        self.free.push(buf);
    }

    /// Compute a message's encoded length, reusing a pooled spill buffer.
    ///
    /// The pooled equivalent of [`Message::encoded_len`](crate::Message::encoded_len).
    #[inline]
    #[must_use]
    pub fn encoded_len<M: crate::Message>(&mut self, msg: &M) -> u32 {
        let mut cache = self.acquire();
        let len = msg.compute_size(&mut cache);
        self.release(cache);
        len
    }

    /// Encode a message into `buf`, reusing a pooled spill buffer.
    ///
    /// The pooled equivalent of [`Message::encode`](crate::Message::encode).
    #[inline]
    pub fn encode<M: crate::Message>(&mut self, msg: &M, buf: &mut impl bytes::BufMut) {
        let mut cache = self.acquire();
        msg.encode_with_cache(&mut cache, buf);
        self.release(cache);
    }

    /// Encode a borrowed message view into `buf`, reusing a pooled spill buffer.
    ///
    /// The pooled equivalent of [`ViewEncode::encode`](crate::ViewEncode::encode).
    #[inline]
    pub fn encode_view<'a, V: crate::ViewEncode<'a>>(
        &mut self,
        view: &V,
        buf: &mut impl bytes::BufMut,
    ) {
        let mut cache = self.acquire();
        view.encode_with_cache(&mut cache, buf);
        self.release(cache);
    }
}

#[cfg(test)]
mod tests {
    use super::*;

    #[test]
    fn empty_cache_is_default() {
        let c = SizeCache::new();
        assert_eq!(c.len, 0);
        assert_eq!(c.cursor, 0);
        assert!(c.spill.is_empty());
    }

    #[test]
    fn spill_past_inline_cap_preserves_order() {
        const N: usize = INLINE_CAP * 2 + 5;
        let mut c = SizeCache::new();
        let slots: alloc::vec::Vec<usize> = (0..N).map(|_| c.reserve()).collect();
        // Fill in reverse to prove set() addresses by slot index, not push order.
        for (i, &s) in slots.iter().enumerate().rev() {
            c.set(s, i as u32 * 7);
        }
        assert_eq!(c.spill.len(), N - INLINE_CAP);
        for i in 0..N {
            assert_eq!(c.consume_next(), i as u32 * 7);
        }
    }

    #[test]
    fn boundary_at_inline_cap() {
        let mut c = SizeCache::new();
        for i in 0..INLINE_CAP {
            let s = c.reserve();
            c.set(s, i as u32);
        }
        assert!(c.spill.is_empty(), "no spill at exactly INLINE_CAP");
        let s = c.reserve();
        c.set(s, 999);
        assert_eq!(c.spill.len(), 1);
        for i in 0..INLINE_CAP {
            assert_eq!(c.consume_next(), i as u32);
        }
        assert_eq!(c.consume_next(), 999);
    }

    #[test]
    fn reserve_set_next_roundtrip() {
        let mut c = SizeCache::new();
        let s0 = c.reserve();
        let s1 = c.reserve();
        c.set(s0, 10);
        c.set(s1, 20);
        assert_eq!(c.consume_next(), 10);
        assert_eq!(c.consume_next(), 20);
    }

    #[test]
    fn preorder_reservation_with_nested_recursion() {
        // Simulates: root has children [A, B]; A has child X.
        // compute_size pre-order entry: A, X, B
        // write_to consumes in the same order.
        let mut c = SizeCache::new();

        // compute root:
        //   reserve slot for A
        let slot_a = c.reserve();
        //     compute A:
        //       reserve slot for X
        let slot_x = c.reserve();
        //         compute X: leaf, no nested messages, returns 5
        c.set(slot_x, 5);
        //       A returns 7 (includes X's 5 plus framing)
        c.set(slot_a, 7);
        //   reserve slot for B
        let slot_b = c.reserve();
        //     compute B: leaf, returns 3
        c.set(slot_b, 3);

        // write_to root consumes A, X, B in pre-order:
        assert_eq!(c.consume_next(), 7); // A's length prefix
        assert_eq!(c.consume_next(), 5); // X's length prefix (inside A.write_to)
        assert_eq!(c.consume_next(), 3); // B's length prefix
    }

    #[test]
    fn clear_resets_and_retains_capacity() {
        let mut c = SizeCache::new();
        for _ in 0..(INLINE_CAP + 4) {
            c.reserve();
        }
        let cap = c.spill.capacity();
        assert!(cap >= 4);
        c.clear();
        assert_eq!(c.len, 0);
        assert_eq!(c.cursor, 0);
        assert!(c.spill.capacity() >= cap);
        // Reusable after clear:
        let s = c.reserve();
        c.set(s, 99);
        assert_eq!(c.consume_next(), 99);
    }

    #[test]
    fn reserve_without_set_yields_zero() {
        let mut c = SizeCache::new();
        let _ = c.reserve();
        assert_eq!(c.consume_next(), 0);
    }

    #[test]
    fn clear_then_reserve_without_set_yields_zero() {
        let mut c = SizeCache::new();
        for i in 0..(INLINE_CAP + 3) {
            let s = c.reserve();
            c.set(s, (i + 100) as u32);
        }
        c.clear();
        // After clear, a fresh reserve() must overwrite stale inline data.
        let _ = c.reserve();
        assert_eq!(c.consume_next(), 0);
    }

    #[test]
    #[should_panic(expected = "SizeCache cursor overrun")]
    fn next_past_end_panics() {
        let mut c = SizeCache::new();
        c.consume_next();
    }

    /// Exercises the inline/spill boundary with out-of-order `set` and a
    /// `clear`-and-reuse cycle. Run under `cargo +nightly miri test` this is the
    /// mechanical check that `consume_next`'s `assume_init` never reads
    /// uninitialized memory: every `reserve`d slot below `len` must be init.
    #[test]
    fn miri_soundness_interleaved_reserve_set_consume() {
        let mut c = SizeCache::new();
        // Two full inline tiers' worth, crossing the spill boundary.
        let n = INLINE_CAP * 2 + 3;
        let slots: Vec<usize> = (0..n).map(|_| c.reserve()).collect();
        // Fill out of order (reverse) to decouple set order from reserve order.
        for (i, &s) in slots.iter().enumerate().rev() {
            c.set(s, (i as u32).wrapping_mul(3).wrapping_add(1));
        }
        for i in 0..n {
            assert_eq!(c.consume_next(), (i as u32).wrapping_mul(3).wrapping_add(1));
        }
        // Reuse: a shorter run must not read stale/uninit tail slots.
        c.clear();
        let a = c.reserve();
        let b = c.reserve();
        c.set(b, 20);
        // `a` reserved-but-not-set -> deterministic 0 (placeholder write).
        assert_eq!(c.consume_next(), 0);
        assert_eq!(c.consume_next(), 20);
        let _ = a;
    }

    // ── SizeCachePool ────────────────────────────────────────────────────

    /// Drive a cache from the pool through enough reserves to force a spill,
    /// fill the slots, then return it.
    fn spill_and_return(pool: &mut SizeCachePool, slots: usize) {
        let mut c = pool.acquire();
        for i in 0..slots {
            let s = c.reserve();
            c.set(s, i as u32);
        }
        pool.release(c);
    }

    #[test]
    fn with_spill_buffer_clears_and_retains_capacity() {
        let mut donor = Vec::with_capacity(40);
        donor.extend_from_slice(&[7, 7, 7]);
        let cap = donor.capacity();
        let c = SizeCache::with_spill_buffer(donor);
        assert_eq!(c.len, 0);
        assert!(c.spill.is_empty());
        assert!(c.spill.capacity() >= cap, "retains donor capacity");
    }

    #[test]
    fn into_spill_buffer_roundtrips_through_with_spill_buffer() {
        let mut c = SizeCache::new();
        for _ in 0..(INLINE_CAP + 5) {
            c.reserve();
        }
        let buf = c.into_spill_buffer();
        let grown = buf.capacity();
        assert!(grown >= 5);
        let c2 = SizeCache::with_spill_buffer(buf);
        assert!(c2.spill.capacity() >= grown, "allocation reused");
        assert_eq!(c2.len, 0);
    }

    #[test]
    fn pool_reuses_spill_allocation() {
        let mut pool = SizeCachePool::new(4, 1024);
        spill_and_return(&mut pool, INLINE_CAP + 5);
        assert_eq!(pool.free.len(), 1, "spilled buffer retained");
        let grown = pool.free[0].capacity();
        // Next acquire hands back the grown buffer.
        let c = pool.acquire();
        assert!(c.spill.capacity() >= grown, "spill capacity reused");
        assert_eq!(c.len, 0);
    }

    #[test]
    fn pool_does_not_retain_non_spilling_caches() {
        let mut pool = SizeCachePool::new(4, 1024);
        let mut c = pool.acquire();
        let s = c.reserve(); // stays inline, no heap buffer
        c.set(s, 1);
        pool.release(c);
        assert!(pool.free.is_empty(), "empty (cap 0) buffers are not pooled");
    }

    #[test]
    fn pool_respects_max_buffers() {
        let mut pool = SizeCachePool::new(1, 1024);
        for _ in 0..3 {
            spill_and_return(&mut pool, INLINE_CAP + 2);
        }
        assert!(pool.free.len() <= 1, "free-list bounded by max_buffers");
    }

    #[test]
    fn pool_shrinks_oversized_buffer_on_return() {
        let mut pool = SizeCachePool::new(4, 8);
        spill_and_return(&mut pool, INLINE_CAP + 100);
        assert!(
            pool.free[0].capacity() <= 8,
            "oversized buffer shrunk to cap"
        );
    }

    #[test]
    fn pool_acquire_release_default_is_empty() {
        let mut pool = SizeCachePool::new(2, 64);
        let c = pool.acquire(); // empty pool -> fresh cache
        assert_eq!(c.len, 0);
        pool.release(c); // never spilled -> dropped
        assert!(pool.free.is_empty());
    }

    #[test]
    fn pool_sequential_caps_buffers_at_one() {
        let mut pool = SizeCachePool::sequential(1024);
        assert_eq!(pool.max_buffers, 1);
        for _ in 0..3 {
            spill_and_return(&mut pool, INLINE_CAP + 2);
        }
        assert_eq!(pool.free.len(), 1, "sequential retains exactly one buffer");
    }

    #[test]
    fn pool_max_capacity_zero_disables_retention() {
        let mut pool = SizeCachePool::new(4, 0);
        // Even a spilled buffer shrinks to 0 and must not be parked empty.
        spill_and_return(&mut pool, INLINE_CAP + 50);
        assert!(
            pool.free.is_empty(),
            "max_capacity 0 retains no (zero-capacity) buffers"
        );
        // And the pool still yields a usable cache.
        let mut c = pool.acquire();
        let s = c.reserve();
        c.set(s, 9);
        assert_eq!(c.consume_next(), 9);
    }
}