baracuda_kernels::quantize::dynamic_range

Struct DynamicRangeQuantizeArgs

/// Args bundle for a `dynamic_range_quantize` launch.
///
/// The caller does not supply scale / zero_point: the scale is computed by
/// the kernel from the runtime dynamic range and written into `scale_out`,
/// so a downstream dequantize step has access to the same scale.
/// `zero_point` is implicit (= 0 for symmetric) and is not materialized.
pub struct DynamicRangeQuantizeArgs<'a, TIn: Element, TOut: IntElement> {
    /// Input `[N, D]` in FP.
    pub input: TensorRef<'a, TIn, 2>,
    /// Per-row scale `[N]` in FP — written by the kernel.
    pub scale_out: TensorMut<'a, TIn, 1>,
    /// Output `[N, D]` in int.
    pub output: TensorMut<'a, TOut, 2>,
}

Expand description

Args bundle for a dynamic_range_quantize launch.

Compared with super::QuantizePerTokenArgs, the caller does NOT supply scale / zero_point — those are computed by the kernel from the runtime dynamic range. The plan writes scale[N] into the caller-supplied scale_out buffer so a downstream dequantize step has access to the same scale.

zero_point is implicit (= 0 for symmetric) and is not materialized.

Fields§

§input: TensorRef<'a, TIn, 2>

Input [N, D] in FP.

§scale_out: TensorMut<'a, TIn, 1>

Per-row scale [N] in FP — written by the kernel.

§output: TensorMut<'a, TOut, 2>

Output [N, D] in int.

Auto Trait Implementations§

§

impl<'a, TIn, TOut> !UnwindSafe for DynamicRangeQuantizeArgs<'a, TIn, TOut>

§

impl<'a, TIn, TOut> Freeze for DynamicRangeQuantizeArgs<'a, TIn, TOut>

§

impl<'a, TIn, TOut> RefUnwindSafe for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: RefUnwindSafe, TOut: RefUnwindSafe,

§

impl<'a, TIn, TOut> Send for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: Sync + Send, TOut: Send,

§

impl<'a, TIn, TOut> Sync for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: Sync, TOut: Sync,

§

DynamicRangeQuantizeArgs

Struct DynamicRangeQuantizeArgs Copy item path

Fields§

Auto Trait Implementations§

impl<'a, TIn, TOut> !UnwindSafe for DynamicRangeQuantizeArgs<'a, TIn, TOut>

impl<'a, TIn, TOut> Freeze for DynamicRangeQuantizeArgs<'a, TIn, TOut>

impl<'a, TIn, TOut> RefUnwindSafe for DynamicRangeQuantizeArgs<'a, TIn, TOut> where TIn: RefUnwindSafe, TOut: RefUnwindSafe,

impl<'a, TIn, TOut> Send for DynamicRangeQuantizeArgs<'a, TIn, TOut> where TIn: Sync + Send, TOut: Send,

impl<'a, TIn, TOut> Sync for DynamicRangeQuantizeArgs<'a, TIn, TOut> where TIn: Sync, TOut: Sync,

impl<'a, TIn, TOut> Unpin for DynamicRangeQuantizeArgs<'a, TIn, TOut>

impl<'a, TIn, TOut> UnsafeUnpin for DynamicRangeQuantizeArgs<'a, TIn, TOut>

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Struct DynamicRangeQuantizeArgs

impl<'a, TIn, TOut> RefUnwindSafe for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: RefUnwindSafe, TOut: RefUnwindSafe,

impl<'a, TIn, TOut> Send for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: Sync + Send, TOut: Send,

impl<'a, TIn, TOut> Sync for DynamicRangeQuantizeArgs<'a, TIn, TOut>
where TIn: Sync, TOut: Sync,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,