hanzo-engine 0.6.1

Hanzo Engine: a fast, flexible LLM inference engine written in Rust.
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
// Submodules that make up this module. Every submodule is public except
// `staging`, which is restricted to this crate via `pub(crate)`.
// NOTE(review): the item names below suggest these are the pieces of a
// speculative-decoding pipeline — confirm against each submodule's own docs.
pub mod cache;
pub mod config;
pub mod driver;
pub mod logging;
pub mod proposer;
pub(crate) mod staging;
pub mod target;
pub mod verifier;

// Convenience re-exports: these items can be named directly from this module
// instead of through their defining submodule. Only `config`, `logging`,
// `proposer`, and `target` have items re-exported here; items in `cache`,
// `driver`, and `verifier` must be reached through their module paths.
pub use config::{MtpConfig, SpeculativeConfig};
pub use logging::{SpeculativeAttachInfo, SpeculativeAttachKind};
pub use proposer::{
    SpeculativeKvCache, SpeculativeProposal, SpeculativeProposalBatch, SpeculativeProposeBatchCtx,
    SpeculativeProposer, TargetTokenEmbedder,
};
pub use target::SpeculativeTargetMixin;