pub enum QuantizationPrecision {
FP16,
FP8,
INT8,
INT4,
INT2,
INT1,
Mixed,
Adaptive,
}
Expand description
Quantization precision levels
Variants§
FP16
16-bit floating point
FP8
8-bit floating point (E4M3 or E5M2 format)
INT8
8-bit integer
INT4
4-bit integer
INT2
2-bit integer (experimental)
INT1
1-bit binary quantization
Mixed
Mixed precision (FP16 for outliers, INT8 for normal weights)
Adaptive
Adaptive precision based on layer importance
Trait Implementations§
Source§impl Clone for QuantizationPrecision
impl Clone for QuantizationPrecision
Source§fn clone(&self) -> QuantizationPrecision
fn clone(&self) -> QuantizationPrecision
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for QuantizationPrecision
impl Debug for QuantizationPrecision
Source§impl<'de> Deserialize<'de> for QuantizationPrecision
impl<'de> Deserialize<'de> for QuantizationPrecision
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error> where
__D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Source§impl From<QuantizationPrecision> for JsValue
impl From<QuantizationPrecision> for JsValue
Source§fn from(value: QuantizationPrecision) -> Self
fn from(value: QuantizationPrecision) -> Self
Converts to this type from the input type.
Source§impl FromWasmAbi for QuantizationPrecision
impl FromWasmAbi for QuantizationPrecision
Source§impl IntoWasmAbi for QuantizationPrecision
impl IntoWasmAbi for QuantizationPrecision
Source§impl PartialEq for QuantizationPrecision
impl PartialEq for QuantizationPrecision
Source§impl Serialize for QuantizationPrecision
impl Serialize for QuantizationPrecision
Source§impl VectorFromWasmAbi for QuantizationPrecision
impl VectorFromWasmAbi for QuantizationPrecision
type Abi = <Box<[JsValue]> as FromWasmAbi>::Abi
unsafe fn vector_from_abi(js: Self::Abi) -> Box<[QuantizationPrecision]>
Source§impl VectorIntoWasmAbi for QuantizationPrecision
impl VectorIntoWasmAbi for QuantizationPrecision
type Abi = <Box<[JsValue]> as IntoWasmAbi>::Abi
fn vector_into_abi(vector: Box<[QuantizationPrecision]>) -> Self::Abi
Source§impl WasmDescribeVector for QuantizationPrecision
impl WasmDescribeVector for QuantizationPrecision
impl Copy for QuantizationPrecision
impl Eq for QuantizationPrecision
impl StructuralPartialEq for QuantizationPrecision
Auto Trait Implementations§
impl Freeze for QuantizationPrecision
impl RefUnwindSafe for QuantizationPrecision
impl Send for QuantizationPrecision
impl Sync for QuantizationPrecision
impl Unpin for QuantizationPrecision
impl UnsafeUnpin for QuantizationPrecision
impl UnwindSafe for QuantizationPrecision
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T where
T: ?Sized,
impl<T> BorrowMut<T> for T where
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T where
T: Clone,
impl<T> CloneToUninit for T where
T: Clone,
Source§impl<T> ReturnWasmAbi for T where
T: IntoWasmAbi,
impl<T> ReturnWasmAbi for T where
T: IntoWasmAbi,
Source§type Abi = <T as IntoWasmAbi>::Abi
type Abi = <T as IntoWasmAbi>::Abi
Same as IntoWasmAbi::Abi
Source§fn return_abi(self) -> <T as ReturnWasmAbi>::Abi
fn return_abi(self) -> <T as ReturnWasmAbi>::Abi
Same as IntoWasmAbi::into_abi, except that it may throw and never return in the case of Err.