// sipp-rs 0.1.0
//
// Unified Rust library for extensible Sipp inference
// Submodules declared without `pub`: code outside this module reaches their
// items through the re-exports below rather than through the submodule paths.
mod inference_config;
mod scheduler_policy;

// Re-export the listed items from `inference_config` under this module's own
// path, so callers do not need to name the submodule.
pub use inference_config::{
    CacheRuntimeConfig, ContextRuntimeConfig, FlashAttentionMode, GenerateOptions, GpuLayerConfig,
    KvCacheType, KvReuseMode, LogitBias, ModelPlacementConfig, MultimodalRuntimeConfig,
    NativeRuntimeConfig, ObservabilityRuntimeConfig, ResidencyRuntimeConfig, ResolvedRuntimeLimits,
    RopeScaling, SamplerStage, SamplingRuntimeConfig, SamplingRuntimeOverride,
    SchedulerRuntimeConfig, SplitMode, DEFAULT_CONTEXT_KEY, DEFAULT_MAX_TOKENS,
};
// Re-export the listed items from `scheduler_policy` in the same way.
pub use scheduler_policy::{SchedulerPolicyConfig, SchedulerPolicyMode, SchedulerTickBudget};