List of all items
Structs
- AttentionConfig
- ModelConfig
- ModelInfo
- RopeScaling
- architectures::bert::BertModelWrapper
- architectures::llama::Attention
- architectures::llama::Config
- architectures::llama::DecoderLayer
- architectures::llama::LlamaModelWrapper
- architectures::llama::Mlp
- architectures::llama::Model
- architectures::llama::PreAllocKvCache
- architectures::llama::RmsNormWithWeight
- architectures::llama::RotaryEmbedding
- architectures::qwen2::Qwen2ModelWrapper
- architectures::qwen3::Config
- architectures::qwen3::Model
- architectures::qwen3::ModelForCausalLM
- architectures::qwen3::Qwen3ModelWrapper
- builder::DefaultModelBuilderFactory
- builder::SimpleModelBuilder
- definition::ConfigManager
- definition::ModelDefinition
- executor::bert_executor::BertModelExecutor
- executor::candle_executor::CandleModelExecutor
- executor::common::GenericKvCacheHandle
- executor::qwen2_executor::Qwen2ModelExecutor
- executor::qwen3_executor::Qwen3ModelExecutor
- executor::stub_executor::StubModelExecutor
- hf_download::HfDownloader
- loader::gptq_loader::GptqLayerWeights
- loader::gptq_loader::QuantizeConfig
- loader::safetensors_loader::SafeTensorsLoader
- registry::DefaultModelRegistry
- registry::ModelAlias
- registry::ModelDiscoveryEntry
- source::DefaultModelSourceResolver
- source::ModelSourceConfig
- source::ResolvedModelSource
- tensor_wrapper::CandleTensorWrapper
- tokenizer::PlaceholderTokenizer
- tokenizer::TokenizerFactory
- tokenizer::TokenizerHandle
- weights::GGUFLoader
- weights::SafeTensorsLoader
- weights::StubWeightLoader
- weights::WeightLoaderHandle
Enums
Traits
Functions
- executor::common::default_executor_status
- executor::common::tensor_to_tokens
- executor::common::tokens_to_tensor
- executor::common::wrap_tensor
- loader::gptq_loader::load_gptq_weights
- weights::default_weight_loader