ferrum-kv 0.7.4

KV cache management with PagedAttention for Ferrum inference
Documentation
1
2
3
4
5
/// Compression submodule. Its `CompressionManager` and `NoCompression` items
/// are re-exported from this module (see the `pub use` lines below).
pub mod compression;
/// Prefix submodule. Its `PrefixCache` item is re-exported from this module
/// (see the `pub use` lines below).
pub mod prefix;

// Convenience re-exports: callers can name these items directly from this
// module instead of spelling out the `compression::` / `prefix::` paths.
// The submodules themselves stay public, so the longer paths keep working.
pub use compression::{CompressionManager, NoCompression};
pub use prefix::PrefixCache;