cowstr 0.11.0

Copy-on-Write shared strings
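
For orientation, a minimal usage sketch. It assumes the crate's public `CowStr` type
provides `From<&str>`, a cheap `Clone`, `push_str`, and `as_str` (names inferred from
this source; see the crate documentation for the exact API):

use cowstr::CowStr;

fn main() {
    // cloning is O(1): both handles share one reference-counted allocation
    let a = CowStr::from("hello");
    let mut b = a.clone();

    // mutation is copy-on-write: `b` detaches before appending, `a` is unchanged
    b.push_str(" world");

    assert_eq!(a.as_str(), "hello");
    assert_eq!(b.as_str(), "hello world");
}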
use core::mem::{align_of, size_of};
use std::alloc;
use std::alloc::Layout;
use std::ptr::{addr_of_mut, NonNull};

#[cfg(not(feature = "multithreaded"))]
use std::cell::Cell;

#[cfg(feature = "multithreaded")]
use std::sync::atomic::{fence, AtomicUsize, Ordering};

#[cfg(feature = "multithreaded")]
use parking_lot::Mutex;

use crate::CapacityError;

/// The inner reference-counted `String`-like buffer (multithreaded variant).
#[cfg(feature = "multithreaded")]
#[derive(Debug)]
#[repr(C, align(32))]
pub(crate) struct RcString {
    refcount: AtomicUsize,
    len: AtomicUsize,
    capacity: usize,
    push_lock: Mutex<()>, // protects `data` and `len` in the try_push*_locked methods
    data: [u8; 0],
}

/// The inner reference-counted `String`-like buffer (single-threaded variant).
#[cfg(not(feature = "multithreaded"))]
#[derive(Debug)]
#[repr(C, align(32))]
pub(crate) struct RcString {
    refcount: Cell<usize>,
    len: Cell<usize>,
    capacity: usize,
    data: [u8; 0],
}

const RCSTRING_SIZE: usize = size_of::<RcString>();
const RCSTRING_ALIGN: usize = align_of::<RcString>();
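
// Memory layout of one allocation, as set up by `allocate` below: a 32-byte-aligned
// header followed by the string bytes stored inline, so `RcString` pointers stay thin
// (illustrative diagram):
//
//   | refcount | len | capacity | push_lock* | data ... `capacity` bytes ... |
//   |<------------ RCSTRING_SIZE ---------->|
//
//   * `push_lock` is only present with the `multithreaded` feature.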

impl RcString {
    pub(crate) fn allocate(capacity: usize) -> NonNull<Self> {
        unsafe {
            let layout = Layout::from_size_align_unchecked(
                capacity
                    .checked_add(RCSTRING_SIZE)
                    .expect("Capacity overflow"),
                RCSTRING_ALIGN,
            );

            let rcstring = alloc::alloc(layout) as *mut Self;
            if rcstring.is_null() {
                alloc::handle_alloc_error(layout);
            }

            #[cfg(feature = "multithreaded")]
            addr_of_mut!((*rcstring).refcount).write(AtomicUsize::new(1usize));
            #[cfg(not(feature = "multithreaded"))]
            addr_of_mut!((*rcstring).refcount).write(Cell::new(1usize));

            #[cfg(feature = "multithreaded")]
            addr_of_mut!((*rcstring).len).write(AtomicUsize::new(0));
            #[cfg(not(feature = "multithreaded"))]
            addr_of_mut!((*rcstring).len).write(Cell::new(0));

            addr_of_mut!((*rcstring).capacity).write(layout.size() - RCSTRING_SIZE);

            #[cfg(feature = "multithreaded")]
            addr_of_mut!((*rcstring).push_lock).write(Mutex::new(()));

            NonNull::new_unchecked(rcstring)
        }
    }

    pub(crate) fn grow(this: NonNull<Self>, reserve: usize) -> NonNull<Self> {
        unsafe {
            debug_assert_eq!(this.as_ref().strong_count(), 1);

            let layout = Layout::from_size_align_unchecked(
                this.as_ref().capacity + RCSTRING_SIZE,
                RCSTRING_ALIGN,
            );

            let min_new_size = (this.as_ref().len_relaxed() + RCSTRING_SIZE)
                .checked_add(reserve)
                .expect("Capacity overflow");

            let new_size = DEFAULT_ALLOCATION_STRATEGY
                .grow(layout.size(), min_new_size)
                .expect("Capacity overflow");

            let rcstring = alloc::realloc(this.as_ptr() as *mut u8, layout, new_size) as *mut Self;
            if rcstring.is_null() {
                // report the layout that actually failed to allocate, as `shrink` does
                let layout = Layout::from_size_align_unchecked(new_size, RCSTRING_ALIGN);
                alloc::handle_alloc_error(layout);
            }

            addr_of_mut!((*rcstring).capacity).write(new_size - RCSTRING_SIZE);

            NonNull::new_unchecked(rcstring)
        }
    }

    pub(crate) fn shrink(this: NonNull<Self>, new_capacity: usize) -> NonNull<Self> {
        unsafe {
            debug_assert_eq!(this.as_ref().strong_count(), 1);

            let layout = Layout::from_size_align_unchecked(
                this.as_ref().capacity + RCSTRING_SIZE,
                RCSTRING_ALIGN,
            );

            let new_size = DEFAULT_ALLOCATION_STRATEGY.align(
                (this.as_ref().len_relaxed() + RCSTRING_SIZE).max(new_capacity + RCSTRING_SIZE),
            );

            if new_size < layout.size() {
                // really shrink
                let rcstring =
                    alloc::realloc(this.as_ptr() as *mut u8, layout, new_size) as *mut Self;
                if rcstring.is_null() {
                    let layout = Layout::from_size_align_unchecked(new_size, RCSTRING_ALIGN);
                    alloc::handle_alloc_error(layout);
                }

                addr_of_mut!((*rcstring).capacity).write(new_size - RCSTRING_SIZE);

                NonNull::new_unchecked(rcstring)
            } else {
                /* no-op */
                this
            }
        }
    }

    /// Unconditionally deallocates a `RcString`.
    ///
    /// # Safety
    ///
    /// Must only be called with a valid `RcString` pointer whose refcount is zero.
    // the only side effect here is that the memory becomes freed, which we don't care to test
    #[mutants::skip]
    pub(crate) unsafe fn dealloc(this: NonNull<Self>) {
        debug_assert_eq!(this.as_ref().strong_count(), 0);
        let layout = Layout::from_size_align_unchecked(
            this.as_ref().capacity + RCSTRING_SIZE,
            RCSTRING_ALIGN,
        );
        alloc::dealloc(this.as_ptr() as *mut u8, layout);
    }

    /// Creates a new `RcString` from a `&[u8]` with some spare capacity.
    ///
    /// # Safety
    ///
    /// The source must be valid UTF-8.
    unsafe fn from_bytes_unchecked(source: &[u8], reserve: usize) -> NonNull<Self> {
        let mut rcstring = Self::allocate(
            source
                .len()
                .checked_add(reserve)
                .expect("Capacity overflow"),
        );

        // TODO: miri will complain here
        //
        // error: Undefined Behavior: attempting a write access using <198665> at
        //        alloc82691[0x18], but that tag does not exist in the borrow stack for this
        //        location
        //
        // help: <198665> would have been created here, but this is a zero-size retag
        //       ([0x18..0x18]) so the tag in question does not exist anywhere
        //
        // Since RcString is repr(C) and its .data is a ZST and we want RcString pointers to
        // be thin pointer there is currently no way around this. Eventually RcString should
        // become a DST with `data: [u8]` while still passing a thin pointer around. Though this
        // would need ptr::from/to_raw_parts which are currently unstable.
        std::ptr::copy_nonoverlapping(
            source.as_ptr(),
            rcstring.as_mut().data.as_mut_ptr(),
            source.len(),
        );

        rcstring.as_mut().len_set_release(source.len());

        rcstring
    }

    /// Creates a new `RcString` from a &str with some spare capacity.
    #[inline]
    pub(crate) fn from_str(source: &str, reserve: usize) -> NonNull<Self> {
        // Safety: source is a valid utf-8 string
        unsafe { Self::from_bytes_unchecked(source.as_bytes(), reserve) }
    }

    /// Appends the given `char` to the end of this `RcString`.
    ///
    /// # Panics
    ///
    /// Panics when there is not enough spare capacity available. The capacity has to be
    /// extended before calling this.
    #[inline]
    pub(crate) fn push(&mut self, ch: char) {
        let mut buf = [0u8; 4];
        let bytes = ch.encode_utf8(&mut buf).as_bytes();

        assert!(self.spare_capacity() >= bytes.len());

        unsafe {
            std::ptr::copy_nonoverlapping(
                bytes.as_ptr(),
                self.data.as_mut_ptr().add(self.len_relaxed()),
                bytes.len(),
            );
        }
        self.len_add_release(bytes.len());
    }

    /// Tries to append the given `char` to the end of this `RcString`.
    /// This locks the string for appending and fails when there is not enough spare capacity.
    ///
    /// # Safety
    ///
    /// This writes into the spare capacity through a shared reference. The caller must
    /// ensure that the spare capacity is only ever written through this locking API (see
    /// the inline comments) and, without the `multithreaded` feature, that there is no
    /// concurrent access at all.
    pub(crate) unsafe fn try_push_locked(&self, ch: char) -> Result<(), CapacityError> {
        let mut buf = [0u8; 4];
        let bytes = ch.encode_utf8(&mut buf).as_bytes();

        #[cfg(feature = "multithreaded")]
        let _lock = self.push_lock.lock();
        if self.spare_capacity() >= bytes.len() {
            std::ptr::copy_nonoverlapping(
                bytes.as_ptr(),
                // can be safely cast to *mut here because we write into the uninitialized
                // locked part
                (self.data.as_ptr() as *mut u8).add(self.len_relaxed()),
                bytes.len(),
            );

            self.len_add_release(bytes.len());
            Ok(())
        } else {
            Err(CapacityError)
        }
    }

    /// Appends the given `str` to the end of this `RcString`.
    ///
    /// # Panics
    ///
    /// Panics when there is not enough spare capacity available. The capacity has to be
    /// extended before calling this.
    #[inline]
    pub(crate) fn push_str(&mut self, s: &str) {
        assert!(self.spare_capacity() >= s.len());

        unsafe {
            std::ptr::copy_nonoverlapping(
                s.as_ptr(),
                self.data.as_mut_ptr().add(self.len_relaxed()),
                s.len(),
            );
        }
        self.len_add_release(s.len());
    }

    /// Tries to append the given `str` to the end of this `RcString`.
    /// This locks the string for appending and fails when there is not enough spare capacity.
    ///
    /// # Safety
    ///
    /// Same requirements as [`Self::try_push_locked`].
    pub(crate) unsafe fn try_push_str_locked(&self, s: &str) -> Result<(), CapacityError> {
        #[cfg(feature = "multithreaded")]
        let _lock = self.push_lock.lock();
        if self.spare_capacity() >= s.len() {
            std::ptr::copy_nonoverlapping(
                s.as_ptr(),
                // can be safely cast to *mut here because we write into the uninitialized
                // locked part
                (self.data.as_ptr() as *mut u8).add(self.len_relaxed()),
                s.len(),
            );
            self.len_add_release(s.len());
            Ok(())
        } else {
            Err(CapacityError)
        }
    }

    /// Gets the length from the atomic or `Cell` with Relaxed semantics.
    #[cfg(feature = "multithreaded")]
    #[inline(always)]
    fn len_relaxed(&self) -> usize {
        self.len.load(Ordering::Relaxed)
    }

    #[doc(hidden)]
    #[cfg(not(feature = "multithreaded"))]
    #[inline(always)]
    fn len_relaxed(&self) -> usize {
        self.len.get()
    }

    /// Gets the length from the atomic or `Cell` with Acquire semantics.
    #[cfg(feature = "multithreaded")]
    #[inline(always)]
    fn len_acquire(&self) -> usize {
        self.len.load(Ordering::Acquire)
    }

    #[doc(hidden)]
    #[inline(always)]
    #[cfg(not(feature = "multithreaded"))]
    fn len_acquire(&self) -> usize {
        self.len.get()
    }

    /// Adds `n` to the length with Release semantics.
    #[inline(always)]
    fn len_add_release(&self, n: usize) {
        #[cfg(feature = "multithreaded")]
        self.len.fetch_add(n, Ordering::Release);
        #[cfg(not(feature = "multithreaded"))]
        self.len.set(self.len.get() + n);
    }

    /// Sets a new length with Release semantics.
    #[inline(always)]
    fn len_set_release(&self, n: usize) {
        #[cfg(feature = "multithreaded")]
        self.len.store(n, Ordering::Release);
        #[cfg(not(feature = "multithreaded"))]
        self.len.set(n);
    }

    /// Returns self as &str
    #[inline]
    pub(crate) fn as_str(&self) -> &str {
        unsafe {
            std::str::from_utf8_unchecked(std::slice::from_raw_parts(
                self.data.as_ptr(),
                self.len_acquire(),
            ))
        }
    }

    /// Returns self as &mut str
    #[inline]
    pub(crate) fn as_mut_str(&mut self) -> &mut str {
        unsafe {
            std::str::from_utf8_unchecked_mut(std::slice::from_raw_parts_mut(
                self.data.as_mut_ptr(),
                self.len_acquire(),
            ))
        }
    }

    /// Returns the number of bytes that can be pushed without reallocation.
    /// This performs an Acquire load, allowing any subsequent access to be Relaxed.
    #[inline]
    pub(crate) fn spare_capacity(&self) -> usize {
        self.capacity - self.len_acquire()
    }

    /// Returns the capacity of the allocation.
    #[inline]
    pub(crate) fn capacity(&self) -> usize {
        self.capacity
    }

    #[inline]
    #[cfg(feature = "multithreaded")]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn strong_count(&self) -> usize {
        self.refcount.load(Ordering::Relaxed)
    }

    #[inline]
    #[cfg(not(feature = "multithreaded"))]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn strong_count(&self) -> usize {
        self.refcount.get()
    }

    #[cfg(feature = "multithreaded")]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn increment_strong_count(&self) {
        self.refcount.fetch_add(1, Ordering::Relaxed);
    }

    #[cfg(not(feature = "multithreaded"))]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn increment_strong_count(&self) {
        self.refcount.set(self.refcount.get() + 1);
    }

    #[cfg(not(feature = "multithreaded"))]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn decrement_strong_count(&self) -> bool {
        let count = self.refcount.get();
        self.refcount.set(count - 1);
        count == 1
    }

    #[cfg(feature = "multithreaded")]
    #[mutants::skip] /* mutants reports this for unknown reasons */
    pub(crate) fn decrement_strong_count(&self) -> bool {
        if self.refcount.fetch_sub(1, Ordering::Release) == 1 {
            fence(Ordering::Acquire);
            true
        } else {
            false
        }
    }
}
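
// A sketch exercising `grow` and the panicking `push_str` path on a uniquely owned
// `RcString`; the test name and sizes are illustrative.
#[test]
fn grow_and_push_str() {
    let mut rcptr = RcString::from_str("foo", 0);
    unsafe {
        // "foo" was allocated without spare capacity, so reserve room first
        rcptr = RcString::grow(rcptr, 16);
        rcptr.as_mut().push_str("bar");
        assert_eq!(rcptr.as_ref().as_str(), "foobar");

        rcptr.as_ref().decrement_strong_count();
        RcString::dealloc(rcptr);
    }
}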

#[test]
fn refcounting() {
    let rcptr = RcString::from_str("foobar", 0);
    unsafe {
        let rcstr = rcptr.as_ref();
        assert_eq!(rcstr.strong_count(), 1);

        rcstr.increment_strong_count();
        assert_eq!(rcstr.strong_count(), 2);

        rcstr.decrement_strong_count();
        assert_eq!(rcstr.strong_count(), 1);

        rcstr.decrement_strong_count();
        RcString::dealloc(rcptr);
    }
}
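
// A sketch of the intended calling pattern around `try_push_locked`: when it reports
// `CapacityError`, a unique owner grows the allocation and retries. The test name and
// sizes are illustrative.
#[test]
fn try_push_then_grow() {
    let mut rcptr = RcString::from_str("ab", 0);
    unsafe {
        // no spare capacity yet, so the lock-protected push must fail
        assert!(rcptr.as_ref().try_push_locked('c').is_err());

        rcptr = RcString::grow(rcptr, 4);
        assert!(rcptr.as_ref().try_push_locked('c').is_ok());
        assert_eq!(rcptr.as_ref().as_str(), "abc");

        rcptr.as_ref().decrement_strong_count();
        RcString::dealloc(rcptr);
    }
}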

const KB: usize = 1024;
const MB: usize = KB * 1024;
const GB: usize = MB * 1024;

/// The allocation strategy when resizing an allocation
struct AllocationStrategy {
    /// Minimum allocation size returned
    pub min_allocation: usize,
    /// First threshold: below this, allocations are doubled; from here up to `grow_const`
    /// they are increased by 50%.
    pub grow_half: usize,
    /// Second threshold: above this, allocations grow by a constant `grow_const / 2`.
    pub grow_const: usize,
}

const DEFAULT_ALLOCATION_STRATEGY: AllocationStrategy = AllocationStrategy {
    min_allocation: 32,
    grow_half: 8 * MB,
    grow_const: /* 1 */ GB,
};
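
// With these defaults, total allocation sizes (header included) double from 32 bytes
// up to 8 MB, then grow by 50% up to 1 GB, and beyond that by a constant 512 MB step.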

impl AllocationStrategy {
    /// Returns the new size to allocate: the size given by the allocation strategy or,
    /// when that is not sufficient, the `minimum_needed` size; the result is rounded up
    /// to a multiple of `min_allocation`.
    #[inline]
    pub fn grow(&self, old_size: usize, minimum_needed: usize) -> Option<usize> {
        Some(
            self.align(
                if old_size < self.min_allocation {
                    self.min_allocation
                } else if old_size < self.grow_half {
                    old_size.checked_mul(2)?
                } else if old_size < self.grow_const {
                    old_size.checked_add(old_size / 2)?
                } else {
                    old_size.checked_add(self.grow_const / 2)?
                }
                .max(minimum_needed),
            ),
        )
    }

    /// Rounds the size up to the next multiple of `min_allocation` bytes.
    #[inline]
    pub fn align(&self, size: usize) -> usize {
        if size > 0 {
            size.next_multiple_of(self.min_allocation)
        } else {
            0
        }
    }
}
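
// Spot-checks of the growth curve described above; expected values are computed from
// the default thresholds and `align`, and the test name is illustrative.
#[test]
fn allocation_strategy_growth() {
    let s = &DEFAULT_ALLOCATION_STRATEGY;

    // tiny requests are bumped to at least `min_allocation`
    assert_eq!(s.grow(0, 1), Some(32));

    // below `grow_half` the old size is doubled, then aligned
    assert_eq!(s.grow(64, 0), Some(128));

    // between `grow_half` and `grow_const` the size grows by 50%
    assert_eq!(s.grow(16 * MB, 0), Some(24 * MB));

    // above `grow_const` it grows by a constant `grow_const / 2`
    assert_eq!(s.grow(2 * GB, 0), Some(2 * GB + 512 * MB));
}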