mod boolean;
mod null;
mod offset;
pub use boolean::*;
pub use null::*;
pub use offset::*;
use crate::{ArrowNativeType, Buffer, MutableBuffer};
use std::marker::PhantomData;
#[derive(Debug)]
pub struct BufferBuilder<T: ArrowNativeType> {
buffer: MutableBuffer,
len: usize,
_marker: PhantomData<T>,
}
impl<T: ArrowNativeType> BufferBuilder<T> {
#[inline]
pub fn new(capacity: usize) -> Self {
let buffer = MutableBuffer::new(capacity * std::mem::size_of::<T>());
Self {
buffer,
len: 0,
_marker: PhantomData,
}
}
pub unsafe fn new_from_buffer(buffer: MutableBuffer) -> Self {
let buffer_len = buffer.len();
Self {
buffer,
len: buffer_len / std::mem::size_of::<T>(),
_marker: PhantomData,
}
}
pub fn len(&self) -> usize {
self.len
}
pub fn is_empty(&self) -> bool {
self.len == 0
}
pub fn capacity(&self) -> usize {
let byte_capacity = self.buffer.capacity();
byte_capacity / std::mem::size_of::<T>()
}
#[inline]
pub fn advance(&mut self, i: usize) {
self.buffer.extend_zeros(i * std::mem::size_of::<T>());
self.len += i;
}
#[inline]
pub fn reserve(&mut self, n: usize) {
self.buffer.reserve(n * std::mem::size_of::<T>());
}
#[inline]
pub fn append(&mut self, v: T) {
self.reserve(1);
self.buffer.push(v);
self.len += 1;
}
#[inline]
pub fn append_n(&mut self, n: usize, v: T) {
self.reserve(n);
self.extend(std::iter::repeat_n(v, n))
}
#[inline]
pub fn append_n_zeroed(&mut self, n: usize) {
self.buffer.extend_zeros(n * std::mem::size_of::<T>());
self.len += n;
}
#[inline]
pub fn append_slice(&mut self, slice: &[T]) {
self.buffer.extend_from_slice(slice);
self.len += slice.len();
}
#[inline]
pub fn as_slice(&self) -> &[T] {
unsafe { std::slice::from_raw_parts(self.buffer.as_ptr() as _, self.len) }
}
#[inline]
pub fn as_slice_mut(&mut self) -> &mut [T] {
unsafe { std::slice::from_raw_parts_mut(self.buffer.as_mut_ptr() as _, self.len) }
}
#[inline]
pub fn truncate(&mut self, len: usize) {
self.buffer.truncate(len * std::mem::size_of::<T>());
self.len = self.len.min(len);
}
#[inline]
pub unsafe fn append_trusted_len_iter(&mut self, iter: impl IntoIterator<Item = T>) {
let iter = iter.into_iter();
let len = iter
.size_hint()
.1
.expect("append_trusted_len_iter expects upper bound");
self.reserve(len);
self.extend(iter);
}
#[inline]
pub fn finish(&mut self) -> Buffer {
let buf = std::mem::take(&mut self.buffer);
self.len = 0;
buf.into()
}
#[inline]
pub fn build(self) -> Buffer {
self.buffer.into()
}
}
impl<T: ArrowNativeType> Default for BufferBuilder<T> {
fn default() -> Self {
Self::new(0)
}
}
impl<T: ArrowNativeType> Extend<T> for BufferBuilder<T> {
fn extend<I: IntoIterator<Item = T>>(&mut self, iter: I) {
self.buffer.extend(iter.into_iter().inspect(|_| {
self.len += 1;
}))
}
}
impl<T: ArrowNativeType> From<Vec<T>> for BufferBuilder<T> {
fn from(value: Vec<T>) -> Self {
let buffer = MutableBuffer::from(value);
unsafe { Self::new_from_buffer(buffer) }
}
}
impl<T: ArrowNativeType> FromIterator<T> for BufferBuilder<T> {
fn from_iter<I: IntoIterator<Item = T>>(iter: I) -> Self {
let mut builder = Self::default();
builder.extend(iter);
builder
}
}
#[cfg(test)]
mod tests {
use super::*;
use std::mem;
#[test]
fn default() {
let builder = BufferBuilder::<u32>::default();
assert!(builder.is_empty());
assert!(builder.buffer.is_empty());
assert_eq!(builder.buffer.capacity(), 0);
}
#[test]
fn from_iter() {
let input = [1u16, 2, 3, 4];
let builder = input.into_iter().collect::<BufferBuilder<_>>();
assert_eq!(builder.len(), 4);
assert_eq!(builder.buffer.len(), 4 * mem::size_of::<u16>());
}
#[test]
fn extend() {
let input = [1, 2];
let mut builder = input.into_iter().collect::<BufferBuilder<_>>();
assert_eq!(builder.len(), 2);
builder.extend([3, 4]);
assert_eq!(builder.len(), 4);
}
#[test]
fn truncate_safety() {
let mut builder = BufferBuilder::from(vec![40, -63, 90]);
assert_eq!(builder.len(), 3);
builder.truncate(151);
assert_eq!(builder.len(), 3);
builder.advance(219);
assert_eq!(builder.len(), 222);
let slice = builder.as_slice_mut();
assert_eq!(slice.len(), 222);
}
}