Struct Arena

Source

pub struct Arena {
    pub buffer: Buffer,
    pub f16_buffer: Option<Buffer>,
    pub offsets: HashMap<NodeId, usize>,
    pub lens: HashMap<NodeId, usize>,
    pub size: usize,
    pub scratch_off: usize,
    pub scratch_bytes: usize,
}

Expand description

One contiguous arena buffer + per-node byte offsets. Lives for the entire executable graph’s lifetime.

Fields§

§buffer: Buffer

Underlying GPU buffer. Bound as a single STORAGE_READ_WRITE resource for every kernel; offsets disambiguate per-node access.

§f16_buffer: Option<Buffer>

Optional shadow buffer holding f16 versions of every value written via `write_f32`. It is sized at half the arena byte budget: each f32 element pairs with an f16 element at the same logical index, so the corresponding (presumably byte) offsets are related by `f16_off = f32_off / 2`. Created only when the device exposes the `SHADER_F16` feature. Matmul kernels with an f16-typed B input bind both `buffer` (for f32 activations) and `f16_buffer` (for f16 weights), which halves global memory traffic on the dominant matmul reads.

§offsets: HashMap<NodeId, usize>

Per-node byte offset into buffer.

§lens: HashMap<NodeId, usize>

Per-node byte length.

§size: usize

Total arena size in bytes.

§scratch_off: usize

Byte offset of the tail scratch zone (equal to `size - scratch_bytes`). Set when callers request scratch via `from_plan_with_scratch`. Reusable across ops since scratch is temporary — only one op writes to it at a time within a schedule.

§scratch_bytes: usize

Size in bytes of the tail scratch zone (0 when not used).

Struct Arena Copy item path

Fields§

Implementations§

impl Arena

pub fn from_plan_with_scratch( device: &Device, plan: &MemoryPlan, scratch_bytes: usize, ) -> Self

pub fn from_plan(device: &Device, plan: &MemoryPlan) -> Self

pub fn has(&self, id: NodeId) -> bool

pub fn offset(&self, id: NodeId) -> usize

pub fn len_of(&self, id: NodeId) -> usize

pub fn param_fits_f16_mirror(&self, id: NodeId) -> bool

pub fn set_actual_len(&mut self, id: NodeId, bytes: usize)

pub fn write_f32(&self, queue: &Queue, id: NodeId, data: &[f32])

pub fn write_f16_shadow(&self, queue: &Queue, id: NodeId, data: &[f32])

pub fn read_f32(&self, device: &Device, queue: &Queue, id: NodeId) -> Vec<f32>

pub fn read_bytes_range( &self, device: &Device, queue: &Queue, byte_off: usize, len: usize, ) -> Vec<u8>

pub fn write_bytes_range(&self, queue: &Queue, byte_off: usize, data: &[u8])

Auto Trait Implementations§

impl !RefUnwindSafe for Arena

impl !UnwindSafe for Arena

impl Freeze for Arena

impl Send for Arena

impl Sync for Arena

impl Unpin for Arena

impl UnsafeUnpin for Arena

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<T> WasmNotSend for T where T: Send,

impl<T> WasmNotSendSync for T where T: WasmNotSend + WasmNotSync,

impl<T> WasmNotSync for T where T: Sync,

Struct Arena

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<T> WasmNotSend for T
where T: Send,

impl<T> WasmNotSendSync for T
where T: WasmNotSend + WasmNotSync,

impl<T> WasmNotSync for T
where T: Sync,