pub enum Quantization {
Q4_K_S,
Q4_K_M,
Q5_K_S,
Q5_K_M,
Q6_K,
Q8_0,
F16,
F32,
}
Quantization levels for GGUF models.
Quantization reduces model size and memory usage at the cost of some quality. Fewer bits (e.g. Q4) yield a smaller, faster, less accurate model; more bits (e.g. Q8_0 or F16) yield a larger, slower, more accurate one.
Variants
Q4_K_S
4-bit quantization, small variant (smallest, fastest).
Q4_K_M
4-bit quantization, medium variant (recommended for most use cases).
Q5_K_S
5-bit quantization, small variant.
Q5_K_M
5-bit quantization, medium variant (balanced quality/size).
Q6_K
6-bit quantization.
Q8_0
8-bit quantization (high quality).
F16
16-bit floating point (full precision).
F32
32-bit floating point (maximum precision, rarely used).
Implementations
impl Quantization
pub const fn short_name(&self) -> &'static str
Short name without description.
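A minimal sketch of how `short_name` might be used, for example to build a GGUF filename. The enum body, the returned strings, and the file-naming pattern are assumptions for illustration, not the crate's actual implementation.

```rust
// Sketch: `short_name` returns the level's identifier as a string,
// which matches the naming convention commonly used for GGUF files.
#[allow(non_camel_case_types, dead_code)]
#[derive(Clone, Copy)]
enum Quantization {
    Q4_K_M,
    Q8_0,
}

impl Quantization {
    const fn short_name(&self) -> &'static str {
        match self {
            Quantization::Q4_K_M => "Q4_K_M",
            Quantization::Q8_0 => "Q8_0",
        }
    }
}

fn main() {
    // e.g. select the model file matching the desired quantization level
    let file = format!("llama-7b.{}.gguf", Quantization::Q4_K_M.short_name());
    assert_eq!(file, "llama-7b.Q4_K_M.gguf");
    println!("{file}");
}
```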
pub const fn memory_multiplier(&self) -> f32
Approximate memory multiplier (bytes per parameter).
Use this to estimate model memory requirements:
memory_gb = param_billions * multiplier
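The estimation formula above can be sketched as follows. The multiplier values here are rough assumptions (approximate bytes per parameter), not the crate's actual constants.

```rust
// Sketch of estimating model memory from `memory_multiplier`.
#[allow(non_camel_case_types, dead_code)]
#[derive(Clone, Copy)]
enum Quantization {
    Q4_K_M,
    Q8_0,
    F16,
}

impl Quantization {
    const fn memory_multiplier(&self) -> f32 {
        match self {
            Quantization::Q4_K_M => 0.6, // ~4.8 bits/param (assumed)
            Quantization::Q8_0 => 1.1,   // ~8.5 bits/param (assumed)
            Quantization::F16 => 2.0,    // 16 bits/param
        }
    }
}

// memory_gb = param_billions * multiplier
fn estimate_memory_gb(param_billions: f32, q: Quantization) -> f32 {
    param_billions * q.memory_multiplier()
}

fn main() {
    // A 7B model at F16 needs roughly 7.0 * 2.0 = 14 GB.
    let gb = estimate_memory_gb(7.0, Quantization::F16);
    assert!((gb - 14.0).abs() < 1e-3);
    println!("{gb:.1} GB");
}
```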
pub const fn all() -> &'static [Quantization]
Returns all quantization levels in order from smallest to largest.
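The smallest-to-largest ordering of `all()` lends itself to picking the largest level that fits a memory budget. The enum body, multipliers, and `best_fit` helper below are illustrative assumptions mirroring the documented ordering, not part of this API.

```rust
// Sketch: walk `all()` in reverse (largest first) and keep the first
// quantization level whose estimated memory fits the budget.
#[allow(non_camel_case_types)]
#[derive(Clone, Copy, Debug, PartialEq)]
enum Quantization {
    Q4_K_M,
    Q8_0,
    F16,
}

impl Quantization {
    const fn memory_multiplier(&self) -> f32 {
        match self {
            Quantization::Q4_K_M => 0.6, // assumed values
            Quantization::Q8_0 => 1.1,
            Quantization::F16 => 2.0,
        }
    }

    // Smallest to largest, as documented.
    const fn all() -> &'static [Quantization] {
        &[Quantization::Q4_K_M, Quantization::Q8_0, Quantization::F16]
    }
}

fn best_fit(param_billions: f32, budget_gb: f32) -> Option<Quantization> {
    Quantization::all()
        .iter()
        .rev()
        .copied()
        .find(|q| param_billions * q.memory_multiplier() <= budget_gb)
}

fn main() {
    // With a 10 GB budget, a 7B model fits at Q8_0 (~7.7 GB) but not F16 (14 GB).
    assert_eq!(best_fit(7.0, 10.0), Some(Quantization::Q8_0));
}
```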
Trait Implementations
impl Clone for Quantization
fn clone(&self) -> Quantization
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source.