pub struct RealtimeConfig {
pub latency_target_ms: f32,
pub throughput_target_tps: f32,
pub min_batch_size: usize,
pub max_batch_size: usize,
pub kv_cache_pressure_threshold: f32,
pub enable_speculative: bool,
pub speculative: SpeculativeConfig,
pub batch_strategy: BatchSizeStrategy,
pub kv_policy: KvCachePressurePolicy,
pub max_memory_bytes: usize,
pub optimization_interval_ms: u64,
}
Expand description
Configuration for the realtime optimizer.
Fields§
latency_target_ms: f32 — Target latency for TTFT (time to first token), in milliseconds
throughput_target_tps: f32 — Target throughput (tokens per second)
min_batch_size: usize — Minimum batch size
max_batch_size: usize — Maximum batch size
kv_cache_pressure_threshold: f32 — KV cache pressure threshold (0.0 - 1.0)
enable_speculative: bool — Enable speculative decoding
speculative: SpeculativeConfig — Speculative decoding configuration
batch_strategy: BatchSizeStrategy — Batch sizing strategy
kv_policy: KvCachePressurePolicy — KV cache pressure policy
max_memory_bytes: usize — Maximum memory budget (bytes)
optimization_interval_ms: u64 — Optimization interval in milliseconds (how often to recompute decisions)
Trait Implementations§
Source§impl Clone for RealtimeConfig
impl Clone for RealtimeConfig
Source§fn clone(&self) -> RealtimeConfig
fn clone(&self) -> RealtimeConfig
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for RealtimeConfig
impl Debug for RealtimeConfig
Source§impl Default for RealtimeConfig
impl Default for RealtimeConfig
Source§impl<'de> Deserialize<'de> for RealtimeConfig
impl<'de> Deserialize<'de> for RealtimeConfig
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for RealtimeConfig
impl RefUnwindSafe for RealtimeConfig
impl Send for RealtimeConfig
impl Sync for RealtimeConfig
impl Unpin for RealtimeConfig
impl UnsafeUnpin for RealtimeConfig
impl UnwindSafe for RealtimeConfig
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more