pub struct PerformanceSnapshot {
pub timestamp: u64,
pub total_time_ms: f64,
pub memory_usage_mb: f64,
pub peak_memory_mb: f64,
pub gpu_utilization: f64,
pub throughput: f64,
pub batch_size: usize,
pub layer_timings: HashMap<String, f64>,
pub layer_memory: HashMap<String, f64>,
pub hardware_type: Option<HardwareType>,
pub io_wait_pct: Option<f32>,
pub batch_throughput_per_sec: Option<f32>,
pub gpu_peak_throughput: Option<f32>,
pub model_depth: Option<usize>,
pub num_heads: Option<usize>,
pub kv_cache_bytes: Option<u64>,
pub seq_len: Option<usize>,
}
Performance snapshot for analysis
Fields§
timestamp: u64 — Timestamp
total_time_ms: f64 — Total execution time (ms)
memory_usage_mb: f64 — Memory usage (MB)
peak_memory_mb: f64 — Peak memory (MB)
gpu_utilization: f64 — GPU utilization (0-100)
throughput: f64 — Throughput (samples/sec)
batch_size: usize — Batch size used
layer_timings: HashMap<String, f64> — Layer timings (layer name -> time in ms)
layer_memory: HashMap<String, f64> — Memory per layer (layer name -> memory in MB)
hardware_type: Option<HardwareType> — Hardware type for this snapshot; when set, overrides TunerConfig::target_hardware
io_wait_pct: Option<f32> — Fraction of time (0.0-1.0) spent waiting on I/O during this snapshot
batch_throughput_per_sec: Option<f32> — Samples processed per second during this snapshot
gpu_peak_throughput: Option<f32> — Theoretical peak GPU throughput (samples/sec) for the detected GPU
model_depth: Option<usize> — Number of transformer layers in the model
num_heads: Option<usize> — Number of attention heads
kv_cache_bytes: Option<u64> — Current KV-cache size in bytes
seq_len: Option<usize> — Sequence length for this batch
Trait Implementations§
Source§impl Clone for PerformanceSnapshot
impl Clone for PerformanceSnapshot
Source§fn clone(&self) -> PerformanceSnapshot
fn clone(&self) -> PerformanceSnapshot
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more
Source§impl Debug for PerformanceSnapshot
impl Debug for PerformanceSnapshot
Source§impl Default for PerformanceSnapshot
impl Default for PerformanceSnapshot
Source§fn default() -> PerformanceSnapshot
fn default() -> PerformanceSnapshot
Returns the “default value” for a type. Read more
Source§impl<'de> Deserialize<'de> for PerformanceSnapshot
impl<'de> Deserialize<'de> for PerformanceSnapshot
Source§fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
fn deserialize<__D>(__deserializer: __D) -> Result<Self, __D::Error>
where
    __D: Deserializer<'de>,
Deserialize this value from the given Serde deserializer. Read more
Auto Trait Implementations§
impl Freeze for PerformanceSnapshot
impl RefUnwindSafe for PerformanceSnapshot
impl Send for PerformanceSnapshot
impl Sync for PerformanceSnapshot
impl Unpin for PerformanceSnapshot
impl UnsafeUnpin for PerformanceSnapshot
impl UnwindSafe for PerformanceSnapshot
Blanket Implementations§
Source§impl<T> BorrowMut<T> for T
where
    T: ?Sized,
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more
Source§impl<T> CloneToUninit for T
where
    T: Clone,
impl<T> CloneToUninit for T
where
    T: Clone,
Source§impl<T> ConfigSerializable for T
where
    T: Serialize + for<'de> Deserialize<'de>,
impl<T> ConfigSerializable for T
where
    T: Serialize + for<'de> Deserialize<'de>,
Source§fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
fn save_to_file(&self, path: &Path) -> Result<(), TrustformersError>
Save to file
Source§fn load_from_file(path: &Path) -> Result<Self, TrustformersError>
where
    Self: Sized,
fn load_from_file(path: &Path) -> Result<Self, TrustformersError>
where
    Self: Sized,
Load from file
Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left is true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§impl<T> Pointable for T
impl<T> Pointable for T
Source§impl<T> PolicyExt for T
where
    T: ?Sized,
impl<T> PolicyExt for T
where
    T: ?Sized,
Source§impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
impl<SS, SP> SupersetOf<SS> for SP
where
    SS: SubsetOf<SP>,
Source§fn to_subset(&self) -> Option<SS>
fn to_subset(&self) -> Option<SS>
The inverse inclusion map: attempts to construct self from the equivalent element of its superset. Read more
Source§fn is_in_subset(&self) -> bool
fn is_in_subset(&self) -> bool
Checks if self is actually part of its subset T (and can be converted to it).
Source§fn to_subset_unchecked(&self) -> SS
fn to_subset_unchecked(&self) -> SS
Use with care! Same as self.to_subset but without any property checks. Always succeeds.
Source§fn from_subset(element: &SS) -> SP
fn from_subset(element: &SS) -> SP
The inclusion map: converts self to the equivalent element of its superset.