kapsl-llm 0.1.0

Large language model inference with GGUF and ONNX backend support for Kapsl
Documentation
1
2
3
4
5
6
7
8
9
10
11
12
13
14
//! Large language model inference with GGUF and ONNX backend support for Kapsl.
//!
//! This file only declares the crate's public submodules and re-exports
//! [`GgufBackend`]; it contains no logic of its own.

// Public submodules, kept in alphabetical order.
// NOTE(review): the module bodies are not visible from this file, so their
// responsibilities are not described here — see each module's own docs.
pub mod block_manager;
pub mod engine;
pub mod gguf_backend;
pub mod global_scheduler;
pub mod kv_cache;
pub mod llm_backend;
pub mod llm_metrics;
pub mod model_paths;
pub mod radix_tree;
pub mod rag;
pub mod scheduler;
pub mod sequence;

// Re-export so callers can name `GgufBackend` directly from this module
// instead of going through the `gguf_backend` path.
pub use gguf_backend::GgufBackend;