Struct ComputeEngine

Source

pub struct ComputeEngine { /* private fields */ }

Implementations§

Source §

impl ComputeEngine

Source

pub fn new(hardware: HardwareConfig, model: ModelConfig) -> Self

Source

pub fn calculate_iteration_time( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

Calculate the time to process an iteration (in seconds). Takes a batch of requests and the number of tokens to process for each request. Returns max(compute_time, memory_time), since compute and memory transfer happen in parallel.

Source

pub fn calculate_flops_utilization( &self, batch_requests: &[&Request], tokens_per_request: &[u32], actual_time: f64, ) -> f64

Calculate FLOPS utilization for this iteration (0.0 to 1.0)

Source

pub fn calculate_bandwidth_utilization( &self, bytes_transferred: f64, actual_time: f64, ) -> f64

Calculate memory bandwidth utilization for this iteration (0.0 to 1.0)

Source

pub fn calculate_bytes_transferred( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

Calculate total bytes transferred for a batch of requests

Auto Trait Implementations§

§

impl UnwindSafe for ComputeEngine

Blanket Implementations§

Source §

impl<T> Any for T
where T: 'static + ?Sized,

Source §

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more

Source §

impl<T> Borrow<T> for T
where T: ?Sized,

Source §

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more

Source §

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source §

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more

Source §

impl<T> From<T> for T

Source §

fn from(t: T) -> T

Returns the argument unchanged.

Source §

impl<T, U> Into<U> for T
where U: From<T>,

Source §

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source §

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source §

type Error = Infallible

The type returned in the event of a conversion error.

Source §

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.

Source §

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source §

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.

Source §

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.

Source §

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source §

ComputeEngine

Struct ComputeEngine

Implementations§

impl ComputeEngine

pub fn new(hardware: HardwareConfig, model: ModelConfig) -> Self

pub fn calculate_iteration_time( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

pub fn calculate_flops_utilization( &self, batch_requests: &[&Request], tokens_per_request: &[u32], actual_time: f64, ) -> f64

pub fn calculate_bandwidth_utilization( &self, bytes_transferred: f64, actual_time: f64, ) -> f64

pub fn calculate_bytes_transferred( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

Auto Trait Implementations§

impl Freeze for ComputeEngine

impl RefUnwindSafe for ComputeEngine

impl Send for ComputeEngine

impl Sync for ComputeEngine

impl Unpin for ComputeEngine

impl UnsafeUnpin for ComputeEngine

impl UnwindSafe for ComputeEngine

Blanket Implementations§

impl<T> Any for T
where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T
where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T
where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T
where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T
where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

fn vzip(self) -> V

ComputeEngine

Struct ComputeEngine Copy item path

Implementations§

impl ComputeEngine

pub fn new(hardware: HardwareConfig, model: ModelConfig) -> Self

pub fn calculate_iteration_time( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

pub fn calculate_flops_utilization( &self, batch_requests: &[&Request], tokens_per_request: &[u32], actual_time: f64, ) -> f64

pub fn calculate_bandwidth_utilization( &self, bytes_transferred: f64, actual_time: f64, ) -> f64

pub fn calculate_bytes_transferred( &self, batch_requests: &[&Request], tokens_per_request: &[u32], ) -> f64

Auto Trait Implementations§

impl Freeze for ComputeEngine

impl RefUnwindSafe for ComputeEngine

impl Send for ComputeEngine

impl Sync for ComputeEngine

impl Unpin for ComputeEngine

impl UnsafeUnpin for ComputeEngine

impl UnwindSafe for ComputeEngine

Blanket Implementations§

impl<T> Any for T where T: 'static + ?Sized,

fn type_id(&self) -> TypeId

impl<T> Borrow<T> for T where T: ?Sized,

fn borrow(&self) -> &T

impl<T> BorrowMut<T> for T where T: ?Sized,

fn borrow_mut(&mut self) -> &mut T

impl<T> From<T> for T

fn from(t: T) -> T

impl<T, U> Into<U> for T where U: From<T>,

fn into(self) -> U

impl<T, U> TryFrom<U> for T where U: Into<T>,

type Error = Infallible

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

impl<T, U> TryInto<U> for T where U: TryFrom<T>,

type Error = <U as TryFrom<T>>::Error

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

impl<V, T> VZip<V> for T where V: MultiLane<T>,

fn vzip(self) -> V

Struct ComputeEngine

impl<T> Any for T
where T: 'static + ?Sized,

impl<T> Borrow<T> for T
where T: ?Sized,

impl<T> BorrowMut<T> for T
where T: ?Sized,

impl<T, U> Into<U> for T
where U: From<T>,

impl<T, U> TryFrom<U> for T
where U: Into<T>,

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

impl<V, T> VZip<V> for T
where V: MultiLane<T>,