Struct GemmaConfig

Source

pub struct GemmaConfig {
    pub arch: GemmaArch,
    pub vocab_size: usize,
    pub hidden_size: usize,
    pub intermediate_size: usize,
    pub num_hidden_layers: usize,
    pub num_attention_heads: usize,
    pub num_key_value_heads: usize,
    pub max_position_embeddings: usize,
    pub rms_norm_eps: f64,
    pub rope_theta: f64,
    pub tie_word_embeddings: bool,
    pub attention_bias: bool,
    pub head_dim: Option<usize>,
    pub attn_logit_softcapping: Option<f32>,
    pub final_logit_softcapping: Option<f32>,
    pub sliding_window: Option<usize>,
    pub query_pre_attn_scalar: Option<f32>,
    pub effective_num_layers: Option<usize>,
    pub num_experts: usize,
    pub num_experts_used: usize,
    pub expert_ffn_size: usize,
    pub expert_weights_scale: f32,
    pub layer_types: Vec<GemmaLayerType>,
    pub rope_parameters: GemmaRopeMap,
    pub global_head_dim: Option<usize>,
    pub num_global_key_value_heads: Option<usize>,
    pub attention_k_eq_v: bool,
    pub use_bidirectional_attention: Option<String>,
}

Fields§

§arch: GemmaArch

§vocab_size: usize

§hidden_size: usize

§intermediate_size: usize

§num_hidden_layers: usize

§num_attention_heads: usize

§num_key_value_heads: usize

§max_position_embeddings: usize

§rms_norm_eps: f64

§rope_theta: f64

§tie_word_embeddings: bool

§attention_bias: bool

§head_dim: Option<usize>

§attn_logit_softcapping: Option<f32>

§final_logit_softcapping: Option<f32>

§sliding_window: Option<usize>

§query_pre_attn_scalar: Option<f32>

§effective_num_layers: Option<usize>

§num_experts: usize

§num_experts_used: usize

§expert_ffn_size: usize

§expert_weights_scale: f32

§layer_types: Vec<GemmaLayerType>

Per-layer attention kind. Empty for Gemma <=3; when empty, the attention kind of each layer falls back to the strided pattern derived from arch.sliding_window_stride.

§rope_parameters: GemmaRopeMap

Per-attention-kind rope settings. Empty for Gemma <=3.

§global_head_dim: Option<usize>

Head dim for full-attention (global) layers. None ⇒ reuse the base head_dim. Gemma 4 12B sets this to 512 while the sliding head_dim stays at 256.

§num_global_key_value_heads: Option<usize>

Num KV heads for full-attention layers. None ⇒ reuse the base num_key_value_heads. Gemma 4 12B sets this to 1.

§attention_k_eq_v: bool

When true (Gemma 4 12B), the K projection is reused as V at load time: the weights ship only .k_proj, and .v_proj becomes an alias of it.

§use_bidirectional_attention: Option<String>

When "vision", media placeholder spans use bidirectional attention on sliding layers (Gemma 4 unified).

Struct GemmaConfig

Fields§

Implementations§

impl GemmaConfig

pub fn from_file(path: &Path) -> Result<GemmaConfig, Error>

pub fn from_gguf(raw: &GgufFile) -> Result<GemmaConfig, Error>

pub fn head_dim(&self) -> usize

pub fn kv_group_size(&self) -> usize

pub fn q_proj_dim(&self) -> usize

pub fn kv_proj_dim(&self) -> usize

pub fn layer_style(&self) -> GemmaLayerStyle

pub fn active_num_layers(&self) -> usize

pub fn is_moe(&self) -> bool

pub fn use_bidirectional_vision(&self) -> bool

pub fn expert_ffn_dim(&self) -> usize

pub fn attn_score_scale(&self) -> Option<f32>

pub fn layer_attn_options(&self, layer: usize) -> (MaskKind, Option<f32>, Option<f32>)

pub fn is_full_attention_layer(&self, layer: usize) -> bool

pub fn layer_head_dim(&self, layer: usize) -> usize

pub fn layer_num_kv_heads(&self, layer: usize) -> usize

pub fn layer_n_rot(&self, layer: usize) -> usize

pub fn layer_rope_theta(&self, layer: usize) -> f64

Trait Implementations§

impl Clone for GemmaConfig

fn clone(&self) -> GemmaConfig

fn clone_from(&mut self, source: &Self)

impl Debug for GemmaConfig

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

impl<'de> Deserialize<'de> for GemmaConfig

fn deserialize<__D>(__deserializer: __D) -> Result<GemmaConfig, <__D as Deserializer<'de>>::Error> where __D: Deserializer<'de>,

Auto Trait Implementations§

impl Freeze for GemmaConfig

impl RefUnwindSafe for GemmaConfig

impl Send for GemmaConfig

impl Sync for GemmaConfig

impl Unpin for GemmaConfig

impl UnsafeUnpin for GemmaConfig

impl UnwindSafe for GemmaConfig

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> DeserializeOwned for T where T: for<'de> Deserialize<'de>,

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Read<Exclusive, BecauseExclusive> for T where T: ?Sized,

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct GemmaConfig

fn deserialize<__D>(__deserializer: __D) -> Result<GemmaConfig, <__D as Deserializer<'de>>::Error>
where __D: Deserializer<'de>,

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT
where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT
where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T> DeserializeOwned for T
where T: for<'de> Deserialize<'de>,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> Read<Exclusive, BecauseExclusive> for T
where T: ?Sized,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,