Trait WeightLoader

Source

/// Loads model weights for a backend `B`.
///
/// Implementors must be `Send + Sync`.
pub trait WeightLoader<B>: Send + Sync
where
    B: Backend,
{
    /// Load a single tensor by fully qualified name
    /// (e.g. `"model.embed_tokens.weight"`).
    fn load_tensor(&self, name: &str) -> Result<B::Buffer>;

    /// Load a projection as a `Linear`.
    ///
    /// `name` is the module path without the `.weight` suffix, e.g.
    /// `"model.layers.0.self_attn.qkv_proj"`. Which concrete `Linear`
    /// implementation comes back depends on the loader's file format and
    /// quant config.
    fn load_linear(&self, name: &str) -> Result<Box<dyn Linear<B>>>;

    /// NOTE(review): presumably reports whether a tensor called `name` is
    /// available from this loader — confirm against the implementors.
    fn has_tensor(&self, name: &str) -> bool;

    /// NOTE(review): presumably the quantization config this loader works
    /// with, `None` when there is none — confirm against the implementors.
    fn quant_config(&self) -> Option<&QuantConfig>;
}

Required Methods§

Source

fn load_tensor(&self, name: &str) -> Result<B::Buffer>

Load a single tensor by fully qualified name (e.g. "model.embed_tokens.weight").

Source

fn load_linear(&self, name: &str) -> Result<Box<dyn Linear<B>>>

Load a projection as a Linear. The concrete implementation (DenseLinear / GptqLinear / AwqLinear / GgufLinear) depends on the loader’s file format and quant config.

name is the module path without the .weight suffix, e.g. "model.layers.0.self_attn.qkv_proj".

Source