//! sipp-rs 0.1.0
//!
//! Unified Rust library for extensible Sipp inference.

// Crate module tree. Modules declared `pub` are reachable by downstream
// crates; `pub(crate)` and plain `mod` modules are internal to this crate.
pub mod config;
pub(crate) mod inference_runtime;
pub mod llama;
pub mod metrics;
pub(crate) mod numeric;
pub mod request;
mod residency;
pub(crate) mod scheduler;
pub(crate) mod session;

// `inference_runtime` is declared `pub(crate)` above, so its module path is
// not nameable from outside the crate; these re-exports expose the listed
// items at the crate root.
pub use inference_runtime::{InferenceRuntime, RequestStepResult, SchedulerBurstResult};
// Re-export two items from the `sipp_sys` crate at this crate's root.
pub use sipp_sys::{llama_seq_id, llama_token};

/// Crate-internal message text for a cancelled request.
///
/// NOTE(review): the call sites are not visible from this file; presumably
/// this is shared so every cancellation path reports the same string —
/// confirm against the users of this constant.
pub(crate) const REQUEST_CANCELLED_MESSAGE: &str = "Request cancelled.";