pub struct TransformerConfig {
pub num_layers: usize,
pub hidden_size: usize,
pub num_attention_heads: usize,
pub num_kv_heads: usize,
pub head_dim: usize,
pub intermediate_size: usize,
pub vocab_size: usize,
pub max_seq_len: usize,
pub rms_norm_eps: f32,
pub has_qk_norm: bool,
}
Expand description
Configuration for a standard transformer decoder.
Fields§
§num_layers: usize
§hidden_size: usize
§num_attention_heads: usize
§num_kv_heads: usize
§head_dim: usize
§intermediate_size: usize
§vocab_size: usize
§max_seq_len: usize
§rms_norm_eps: f32
§has_qk_norm: bool
Whether Q/K heads have per-head normalization (Qwen3 has this, Llama doesn’t).
Trait Implementations§
Source§impl Clone for TransformerConfig
impl Clone for TransformerConfig
Source§fn clone(&self) -> TransformerConfig
fn clone(&self) -> TransformerConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Auto Trait Implementations§
impl Freeze for TransformerConfig
impl RefUnwindSafe for TransformerConfig
impl Send for TransformerConfig
impl Sync for TransformerConfig
impl Unpin for TransformerConfig
impl UnsafeUnpin for TransformerConfig
impl UnwindSafe for TransformerConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more