Struct Qwen2Model

Source

pub struct Qwen2Model { /* private fields */ }

Expand description

Complete Qwen2 model for inference.

Assembles embedding, decoder layers, and LM head into a complete model.

Implementations§

§

impl Qwen2Model

pub fn new(config: &Qwen2Config) -> Self

Create a new Qwen2 model from configuration.

Weights are initialized randomly. Use load_from_safetensors() or load_from_apr() to load pre-trained weights.

pub fn new_uninitialized(config: &Qwen2Config) -> Self

Create an uninitialized Qwen2 model with minimal memory allocation.

The model is not ready for inference until weights are loaded.

pub fn config(&self) -> &Qwen2Config

Get model configuration.

pub fn eval(&mut self)

Set model to evaluation mode (no dropout).

pub fn train(&mut self)

Set model to training mode.

pub fn enable_cache(&mut self)

Enable KV cache for efficient generation.

pub fn disable_cache(&mut self)

Disable KV cache.

pub fn clear_cache(&mut self)

Clear KV cache.

pub fn num_layers(&self) -> usize

Get number of layers.

pub fn weight_names(&self) -> Vec<String>

Get list of weight names following HuggingFace convention.

Returns names like:

model.embed_tokens.weight
model.layers.0.self_attn.q_proj.weight
model.norm.weight
lm_head.weight

pub fn weight_info(&self) -> HashMap<String, Vec<usize>>

Get weight shapes as a map from name to shape.

pub fn weights(&self) -> HashMap<String, Vec<f32>>

Extract accessible weights as a map from name to f32 data.

Returns a map suitable for serialization to SafeTensors format. Note: currently only weights from components with public accessors are returned; full weight export will be enabled once the nn modules expose weight accessors.

pub fn num_parameters(&self) -> usize

Get total number of parameters in the model.

pub fn embed_tokens_mut(&mut self) -> &mut Embedding

Get mutable reference to embedding layer.

pub fn layer_mut(&mut self, idx: usize) -> Option<&mut Qwen2DecoderLayer>

Get mutable reference to decoder layer at index.

pub fn norm_mut(&mut self) -> &mut RMSNorm

Get mutable reference to final norm layer.

pub fn lm_head_mut(&mut self) -> &mut Linear

Get mutable reference to language model head.

pub fn lm_head(&self) -> &Linear

Get reference to language model head (for testing/inspection).

pub fn load_from_safetensors(&mut self, path: &Path) -> Result<usize, String>

Load weights from SafeTensors format.

§Arguments

path - Path to .safetensors file

§Returns

Number of weights loaded

§Errors

Returns an error if the file cannot be read or the weights don’t match.

pub fn from_safetensors( config: &Qwen2Config, path: &Path, ) -> Result<Self, String>

Load model from SafeTensors file.

Creates a new model with the given config and loads weights from file.

pub fn load_from_apr(&mut self, path: &Path) -> Result<usize, String>

Load weights from APR v2 format file.

Per Native Library Mandate (Spec §2.4): Uses mmap via bundle::MappedFile for zero-copy tensor access. This is the REQUIRED approach for APR files.

Note: APR canonical names don’t have the “model.” prefix (it’s stripped during import per format/converter.rs), so this loader looks up tensor names without that prefix.

§Returns

Number of weights loaded

§Errors

Returns an error if the file cannot be read or the weights don’t match.

pub fn from_apr(config: &Qwen2Config, path: &Path) -> Result<Self, String>

Load model from APR v2 format file.

Creates a new model with the given config and loads weights from file.

Qwen2Model

Struct Qwen2Model Copy item path

Implementations§

impl Qwen2Model

pub fn new(config: &Qwen2Config) -> Self

pub fn new_uninitialized(config: &Qwen2Config) -> Self

pub fn config(&self) -> &Qwen2Config

pub fn eval(&mut self)

pub fn train(&mut self)

pub fn enable_cache(&mut self)

pub fn disable_cache(&mut self)

pub fn clear_cache(&mut self)

pub fn num_layers(&self) -> usize

pub fn weight_names(&self) -> Vec<String>

pub fn weight_info(&self) -> HashMap<String, Vec<usize>>

pub fn weights(&self) -> HashMap<String, Vec<f32>>

pub fn num_parameters(&self) -> usize

pub fn embed_tokens_mut(&mut self) -> &mut Embedding

pub fn layer_mut(&mut self, idx: usize) -> Option<&mut Qwen2DecoderLayer>

pub fn norm_mut(&mut self) -> &mut RMSNorm

pub fn lm_head_mut(&mut self) -> &mut Linear

pub fn lm_head(&self) -> &Linear

pub fn load_from_safetensors(&mut self, path: &Path) -> Result<usize, String>

§Arguments

§Returns

§Errors

pub fn from_safetensors( config: &Qwen2Config, path: &Path, ) -> Result<Self, String>

pub fn load_from_apr(&mut self, path: &Path) -> Result<usize, String>

§Returns

§Errors

pub fn from_apr(config: &Qwen2Config, path: &Path) -> Result<Self, String>

Trait Implementations§

impl Debug for Qwen2Model

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Auto Trait Implementations§

impl Freeze for Qwen2Model

impl !RefUnwindSafe for Qwen2Model

impl Send for Qwen2Model

impl Sync for Qwen2Model

impl Unpin for Qwen2Model

impl UnsafeUnpin for Qwen2Model

impl !UnwindSafe for Qwen2Model

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T> IntoEither for T

fn into_either(self, into_left: bool) -> Either<Self, Self>

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self> where F: FnOnce(&Self) -> bool,

impl<T> Pointable for T

const ALIGN: usize

type Init = T

unsafe fn init(init: <T as Pointable>::Init) -> usize

unsafe fn deref<'a>(ptr: usize) -> &'a T

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

unsafe fn drop(ptr: usize)

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct Qwen2Model

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,