pub struct HardwareProfile {
pub bandwidth_gb_s: f64,
pub compute_gflops: f64,
pub ops_per_token: f64,
}

Hardware profile for roofline calculation.
Fields§
bandwidth_gb_s: f64 — Effective memory bandwidth in GB/s
compute_gflops: f64 — Effective compute throughput in GFLOPS
ops_per_token: f64 — Operations per token (depends on model architecture)
Implementations§
impl HardwareProfile
pub fn apple_m_series() -> Self
Create a profile for Apple M-series (conservative estimates).

pub fn nvidia_a100() -> Self
Create a profile for NVIDIA A100.
Trait Implementations§
impl Clone for HardwareProfile
fn clone(&self) -> HardwareProfile
Returns a duplicate of the value. Read more
1.0.0 · Source§fn clone_from(&mut self, source: &Self)
fn clone_from(&mut self, source: &Self)
Performs copy-assignment from source. Read more

Auto Trait Implementations§
impl Freeze for HardwareProfile
impl RefUnwindSafe for HardwareProfile
impl Send for HardwareProfile
impl Sync for HardwareProfile
impl Unpin for HardwareProfile
impl UnsafeUnpin for HardwareProfile
impl UnwindSafe for HardwareProfile
Blanket Implementations§
impl<T> BorrowMut<T> for T
where
    T: ?Sized,
fn borrow_mut(&mut self) -> &mut T
Mutably borrows from an owned value. Read more