Skip to main content

fib_quant/kv/
mod.rs

1//! KV-cache compression contracts and CPU reference paths.
2//!
3//! The `kv` feature is experimental and default-off. It provides typed
4//! contracts, role-aware policy decisions, and CPU reference encode/decode
5//! helpers for KV-cache pages. It is not a production serving backend.
6
7pub mod attention_ref;
8pub mod block;
9pub mod calibration;
10pub mod codec;
11pub mod layout;
12pub mod page;
13pub mod policy;
14pub mod profile;
15pub mod quality;
16pub mod receipt;
17pub mod shape;
18
19pub use attention_ref::{
20    compare_attention_fixture, reference_attention_logits, reference_value_aggregation,
21};
22pub use block::{KvBlockEncodingV1, KvEncodedBlockV1};
23pub use calibration::{calibrate_kv_tensor, KvCalibrationSummaryV1};
24pub use codec::{decode_kv_pages, encode_kv_tensor, KvDecodedTensorV1, KvEncodedTensorV1};
25pub use layout::{KvCacheLayoutV1, KvLayoutOrder, KvPageGeometryV1};
26pub use page::KvEncodedPageV1;
27pub use policy::{
28    decide_kv_compression, KvCompressionDecisionV1, KvCompressionPolicyV1, KvCompressionStrategyV1,
29    KvDecisionActionV1, KvDecisionReasonV1,
30};
31pub use profile::{
32    KvAxisPolicyV1, KvCompressionProfileV1, KvFallbackModeV1, KvFallbackPolicyV1,
33    KvProtectedPolicyV1, KvQualityBudgetV1,
34};
35pub use quality::{KvAttentionQualityReportV1, KvLayerHeadQualityV1};
36pub use receipt::{
37    kv_tensor_digest, KvCompressionReceiptV1, KvDecodeReceiptV1, KvEvalReceiptV1, KvOperationKindV1,
38};
39pub use shape::{KvAttentionKind, KvDType, KvRole, KvRopeState, KvTensorShapeV1};