Struct PackedBlock

Source

pub struct PackedBlock {
    pub bits: u8,
    pub scale: f16,
    pub packed_indices: Vec<u8>,
}

Expand description

A packed quantized block that stores a scale factor and bit-packed indices.

Replaces the former BlockTQ2, BlockTQ3, and BlockTQ4 structs with a single type that tracks its own bit width.

Fields§

§bits: u8

Bit width used for packing (2, 3, or 4).

§scale: f16

Scaling factor (L2-norm of original vector).

§packed_indices: Vec<u8>

Packed indices (layout depends on bits).

Implementations§

Source §

impl PackedBlock

Source

pub fn new(bits: u8, scale: f16, indices: &[u8]) -> Self

Create a new packed block from a scale and a slice of unpacked index values.

The indices are bit-packed internally based on the specified bits width.

Pure Integration: delegates packing to the bit-width-specific helper selected by the pack closure (IOSP lenient-mode closure pattern).

Source

pub fn size_bytes(&self) -> usize

Total size of the block in bytes (2 bytes for f16 scale + packed data).

Source

pub fn from_raw(bits: u8, scale: f16, packed_indices: Vec<u8>) -> Self

Creates a PackedBlock from pre-packed data without re-packing.

Use this to reconstruct blocks from GPU-quantized data that is already in the correct packed layout.

Pure Operation: field assignment only.

Source

pub fn unpack_into(&self, count: usize, buf: &mut Vec<u8>)

Unpacks stored indices into a caller-provided buffer, avoiding allocation.

This is the hot-path variant: reuses the buffer across repeated calls (e.g. inside attention score loops) to eliminate per-key allocations.

Pure Integration: delegates unpacking to the bit-width-specific helper selected by the do_unpack closure (IOSP lenient-mode closure pattern).

Source

pub fn unpack(&self, count: usize) -> Vec<u8> ⓘ

Recover the unpacked index values.

Allocates a fresh buffer. For hot paths, prefer unpack_into with a reusable buffer.

Auto Trait Implementations§

§

impl UnwindSafe for PackedBlock

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

PackedBlock

Struct PackedBlock

Fields§

Implementations§

impl PackedBlock

pub fn new(bits: u8, scale: f16, indices: &[u8]) -> Self

pub fn size_bytes(&self) -> usize

pub fn from_raw(bits: u8, scale: f16, packed_indices: Vec<u8>) -> Self

pub fn unpack_into(&self, count: usize, buf: &mut Vec<u8>)

pub fn unpack(&self, count: usize) -> Vec<u8> ⓘ

Auto Trait Implementations§

impl Freeze for PackedBlock

impl RefUnwindSafe for PackedBlock

impl Send for PackedBlock

impl Sync for PackedBlock

impl Unpin for PackedBlock

impl UnsafeUnpin for PackedBlock

impl UnwindSafe for PackedBlock

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct PackedBlock Copy item path

Fields§

Implementations§

impl PackedBlock

pub fn new(bits: u8, scale: f16, indices: &[u8]) -> Self

pub fn size_bytes(&self) -> usize

pub fn from_raw(bits: u8, scale: f16, packed_indices: Vec<u8>) -> Self

pub fn unpack_into(&self, count: usize, buf: &mut Vec<u8>)

pub fn unpack(&self, count: usize) -> Vec<u8> ⓘ

Auto Trait Implementations§

impl Freeze for PackedBlock

impl RefUnwindSafe for PackedBlock

impl Send for PackedBlock

impl Sync for PackedBlock

impl Unpin for PackedBlock

impl UnsafeUnpin for PackedBlock

impl UnwindSafe for PackedBlock

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct PackedBlock

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,