Struct Qwen35Config

Source

pub struct Qwen35Config {
    pub vocab_size: usize,
    pub hidden_size: usize,
    pub intermediate_size: usize,
    pub num_hidden_layers: usize,
    pub nextn_predict_layers: usize,
    pub num_attention_heads: usize,
    pub num_key_value_heads: usize,
    pub key_length: usize,
    pub value_length: usize,
    pub max_position_embeddings: usize,
    pub rms_norm_eps: f64,
    pub rope_theta: f64,
    pub rope_dim_count: usize,
    pub rope_dim_sections: Vec<usize>,
    pub full_attention_interval: usize,
    pub ssm_conv_kernel: usize,
    pub ssm_group_count: usize,
    pub ssm_inner_size: usize,
    pub ssm_state_size: usize,
    pub ssm_time_step_rank: usize,
    pub tie_word_embeddings: bool,
    pub num_experts: usize,
    pub num_experts_used: usize,
    pub expert_ffn_size: usize,
    pub shared_expert_ffn_size: usize,
    pub expert_weights_scale: f32,
}

Expand description

Qwen3.5 model config — fields covering both the per-layer Mamba+Attention block and the MTP head.

Fields§

§vocab_size: usize

§hidden_size: usize

§intermediate_size: usize

§num_hidden_layers: usize

Total layer count (= main layers + nextn_predict_layers MTP heads).

§nextn_predict_layers: usize

Layers at index < num_hidden_layers - nextn_predict_layers use the hybrid Mamba+Attention block. The remaining nextn_predict_layers layers use standard attention for MTP.

§num_attention_heads: usize

§num_key_value_heads: usize

§key_length: usize

Per-head Q dim. The MTP attention head uses this.

§value_length: usize

Per-head V dim.

§max_position_embeddings: usize

§rms_norm_eps: f64

§rope_theta: f64

§rope_dim_count: usize

§rope_dim_sections: Vec<usize>

§full_attention_interval: usize

Interval N at which Qwen3.5 uses a full-attention layer (one every N blocks, interspersed with the Mamba-style blocks). The value is read but not yet acted on.

§ssm_conv_kernel: usize

§ssm_group_count: usize

§ssm_inner_size: usize

§ssm_state_size: usize

§ssm_time_step_rank: usize

§tie_word_embeddings: bool

§num_experts: usize

MoE (qwen35moe): routed expert count. Zero for dense models.

§num_experts_used: usize

Top-k experts activated per token.

§expert_ffn_size: usize

Per-expert FFN inner dim (qwen35.expert_feed_forward_length).

§shared_expert_ffn_size: usize

Shared-expert FFN inner dim (qwen35.expert_shared_feed_forward_length).

§expert_weights_scale: f32

Router weight multiplier applied after softmax (llama.cpp default 1.0).

Struct Qwen35Config Copy item path

Fields§

Implementations§

impl Qwen35Config

pub fn from_gguf(raw: &GgufFile) -> Result<Qwen35Config, Error>

pub fn is_moe(&self) -> bool

pub fn expert_ffn_dim(&self) -> usize

pub fn shared_expert_ffn_dim(&self) -> usize

pub fn mtp_layer_start(&self) -> Option<usize>

pub fn from_hf_config_json(path: &Path) -> Result<Qwen35Config, Error>

Trait Implementations§

impl Clone for Qwen35Config

fn clone(&self) -> Qwen35Config

fn clone_from(&mut self, source: &Self)

impl Debug for Qwen35Config

fn fmt(&self, f: &mut Formatter<'_>) -> Result<(), Error>

Auto Trait Implementations§

impl Freeze for Qwen35Config

impl RefUnwindSafe for Qwen35Config

impl Send for Qwen35Config

impl Sync for Qwen35Config

impl Unpin for Qwen35Config

impl UnsafeUnpin for Qwen35Config

impl UnwindSafe for Qwen35Config

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T where T: Clone,

unsafe fn clone_to_uninit(&self, dest: *mut u8)

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T> Read<Exclusive, BecauseExclusive> for T where T: ?Sized,

impl<T> ToOwned for T where T: Clone,

type Owned = T

fn to_owned(&self) -> T

fn clone_into(&self, target: &mut T)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct Qwen35Config

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<ST, DT> CastableFrom<ST, Initialized, Initialized> for DT
where ST: ?Sized, DT: ?Sized,

impl<ST, DT> CastableFrom<ST, Uninit, Uninit> for DT
where ST: ?Sized, DT: ?Sized,

impl<T> CloneToUninit for T
where T: Clone,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T> Read<Exclusive, BecauseExclusive> for T
where T: ?Sized,

impl<T> ToOwned for T
where T: Clone,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,