Skip to main content

ExecutionGraph

Struct ExecutionGraph 

Source
pub struct ExecutionGraph { /* private fields */ }
Expand description

Execution path graph for tracking brick → kernel → PTX relationships.

PAR-201: Captures the full execution hierarchy for profiling analysis.

§Example

use trueno::brick::{BrickId, ExecutionGraph, ExecutionNode, EdgeType};

let mut graph = ExecutionGraph::new();

// Add layer scope
let layer_id = graph.add_node(ExecutionNode::Layer { index: 0 });

// Add brick within layer
let brick_id = graph.add_node(ExecutionNode::Brick {
    id: BrickId::QkvProjection,
    timing_ns: 1000,
    elements: 4096,
});
graph.add_edge(layer_id, brick_id, EdgeType::Contains);

// Add kernel launched by brick
let kernel_id = graph.add_node(ExecutionNode::Kernel {
    name: "batched_q4k_gemv".into(),
    ptx_hash: 0x7a3b1c2d,
    grid: (32, 1, 1),
    block: (256, 1, 1),
    shared_mem: 4096,
});
graph.add_edge(brick_id, kernel_id, EdgeType::Launches);

// Export to trueno-graph for analysis
#[cfg(feature = "execution-graph")]
let csr = graph.to_csr();

Implementations§

Source§

impl ExecutionGraph

Source

pub fn critical_path(&self) -> (Vec<ExecutionNodeId>, u64)

Compute critical path through execution graph using longest-path algorithm.

Returns (critical_path_nodes, total_time_ns). The critical path represents the longest chain of dependencies that determines total execution time.

Reference: Graham et al. (1979) “Scheduling Algorithms for Multi-Processor Systems”

Source

pub fn compute_slack(&self) -> HashMap<ExecutionNodeId, u64>

Compute slack for each node (how much it can be delayed without affecting total time).

Returns map from node ID to slack in nanoseconds. Nodes on critical path have slack = 0.

Source

pub fn roofline_distance( &self, peak_tflops: f32, peak_bandwidth_gb_s: f32, ) -> HashMap<ExecutionNodeId, f32>

Compute roofline distance for kernel nodes.

Returns map from kernel node ID to distance from roofline (0.0 = optimal). Distance = 1.0 - min(achieved/peak_compute, achieved/peak_bandwidth).

Reference: Williams et al. (2009) “Roofline: An Insightful Visual Performance Model”

Source

pub fn detect_ping_pong(&self) -> Vec<(ExecutionNodeId, ExecutionNodeId)>

Detect ping-pong memory transfer patterns: a wasteful host-to-device (H2D) transfer followed by a device-to-host (D2H) transfer.

Returns pairs of transfer node IDs that exhibit ping-pong behavior.

Source

pub fn critical_path_summary(&self) -> String

Get critical path analysis summary as formatted string.

Source§

impl ExecutionGraph

Source

pub fn new() -> Self

Create a new empty execution graph.

Source

pub fn add_node(&mut self, node: ExecutionNode) -> ExecutionNodeId

Add a node to the graph, returning its ID.

Source

pub fn add_edge( &mut self, src: ExecutionNodeId, dst: ExecutionNodeId, edge_type: EdgeType, )

Add an edge between two nodes.

Source

pub fn add_weighted_edge( &mut self, src: ExecutionNodeId, dst: ExecutionNodeId, edge_type: EdgeType, weight: f32, )

Add an edge with a weight.

Source

pub fn push_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId

Push a scope for hierarchical recording. All subsequent nodes will be children of this scope.

Source

pub fn pop_scope(&mut self) -> Option<ExecutionNodeId>

Pop the current scope.

Source

pub fn current_scope(&self) -> Option<ExecutionNodeId>

Get the current scope (if any).

Source

pub fn add_node_in_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId

Add a node under the current scope.

Source

pub fn record_kernel_launch( &mut self, name: &str, ptx_hash: u64, grid: (u32, u32, u32), block: (u32, u32, u32), shared_mem: u32, ) -> ExecutionNodeId

Record a kernel launch under the current scope.

Source

pub fn record_kernel_launch_with_metrics( &mut self, name: &str, ptx_hash: u64, grid: (u32, u32, u32), block: (u32, u32, u32), shared_mem: u32, timing_ns: u64, arithmetic_intensity: f32, achieved_tflops: f32, ) -> ExecutionNodeId

Record a kernel launch with roofline metrics (Phase 9).

Source

pub fn record_transfer( &mut self, src: &str, dst: &str, bytes: u64, direction: TransferDirection, timing_ns: Option<u64>, ) -> ExecutionNodeId

Record a memory transfer (Phase 9: data movement topology).

Source

pub fn add_dependency(&mut self, from: ExecutionNodeId, to: ExecutionNodeId)

Add a dependency edge for critical path analysis (Phase 9).

Source

pub fn node(&self, id: ExecutionNodeId) -> Option<&ExecutionNode>

Get a node by ID.

Source

pub fn node_by_name( &self, name: &str, ) -> Option<(ExecutionNodeId, &ExecutionNode)>

Get a node by name.

Source

pub fn nodes(&self) -> &[ExecutionNode]

Get all nodes.

Source

pub fn edges(&self) -> &[ExecutionEdge]

Get all edges.

Source

pub fn num_nodes(&self) -> usize

Number of nodes.

Source

pub fn num_edges(&self) -> usize

Number of edges.

Source

pub fn outgoing_edges( &self, node: ExecutionNodeId, ) -> impl Iterator<Item = &ExecutionEdge>

Get outgoing edges for a node.

Source

pub fn incoming_edges( &self, node: ExecutionNodeId, ) -> impl Iterator<Item = &ExecutionEdge>

Get incoming edges for a node.

Source

pub fn kernel_nodes( &self, ) -> impl Iterator<Item = (ExecutionNodeId, &ExecutionNode)>

Find all kernel nodes.

Source

pub fn slowest_kernel(&self) -> Option<(ExecutionNodeId, &ExecutionNode, u64)>

Find the slowest kernel (by parent brick timing).

Source

pub fn clear(&mut self)

Clear the graph.

Source

pub fn is_scope_balanced(&self) -> bool

Check if scope stack is balanced (empty).

Source§

impl ExecutionGraph

Source

pub fn to_dot(&self) -> String

Export to DOT format for Graphviz visualization.

Source

pub fn to_csr(&self) -> CsrGraph

Export to trueno-graph CsrGraph format.

Source

pub fn to_tree_node(&self) -> TreeNode

Convert to presentar-terminal TreeNode for TUI visualization.

PAR-201: Renders the execution graph as a collapsible tree in the terminal.

Source

pub fn to_ascii_tree(&self) -> String

Render graph to ASCII tree string (headless mode for testing/automation).

PAR-201: Zero-dependency tree visualization for CI/CD, logging, and snapshot tests.

Trait Implementations§

Source§

impl Debug for ExecutionGraph

Source§

fn fmt(&self, f: &mut Formatter<'_>) -> Result

Formats the value using the given formatter. Read more
Source§

impl Default for ExecutionGraph

Source§

fn default() -> ExecutionGraph

Returns the “default value” for a type. Read more

Auto Trait Implementations§

Blanket Implementations§

Source§

impl<T> Any for T
where T: 'static + ?Sized,

Source§

fn type_id(&self) -> TypeId

Gets the TypeId of self. Read more
Source§

impl<T> Borrow<T> for T
where T: ?Sized,

Source§

fn borrow(&self) -> &T

Immutably borrows from an owned value. Read more
Source§

impl<T> BorrowMut<T> for T
where T: ?Sized,

Source§

fn borrow_mut(&mut self) -> &mut T

Mutably borrows from an owned value. Read more
Source§

impl<T> Conv for T

Source§

fn conv<T>(self) -> T
where Self: Into<T>,

Converts self into T using Into<T>. Read more
Source§

impl<T> Downcast<T> for T

Source§

fn downcast(&self) -> &T

Source§

impl<T> FmtForward for T

Source§

fn fmt_binary(self) -> FmtBinary<Self>
where Self: Binary,

Causes self to use its Binary implementation when Debug-formatted.
Source§

fn fmt_display(self) -> FmtDisplay<Self>
where Self: Display,

Causes self to use its Display implementation when Debug-formatted.
Source§

fn fmt_lower_exp(self) -> FmtLowerExp<Self>
where Self: LowerExp,

Causes self to use its LowerExp implementation when Debug-formatted.
Source§

fn fmt_lower_hex(self) -> FmtLowerHex<Self>
where Self: LowerHex,

Causes self to use its LowerHex implementation when Debug-formatted.
Source§

fn fmt_octal(self) -> FmtOctal<Self>
where Self: Octal,

Causes self to use its Octal implementation when Debug-formatted.
Source§

fn fmt_pointer(self) -> FmtPointer<Self>
where Self: Pointer,

Causes self to use its Pointer implementation when Debug-formatted.
Source§

fn fmt_upper_exp(self) -> FmtUpperExp<Self>
where Self: UpperExp,

Causes self to use its UpperExp implementation when Debug-formatted.
Source§

fn fmt_upper_hex(self) -> FmtUpperHex<Self>
where Self: UpperHex,

Causes self to use its UpperHex implementation when Debug-formatted.
Source§

fn fmt_list(self) -> FmtList<Self>
where for<'a> &'a Self: IntoIterator,

Formats each item in a sequence. Read more
Source§

impl<T> From<T> for T

Source§

fn from(t: T) -> T

Returns the argument unchanged.

Source§

impl<T> Instrument for T

Source§

fn instrument(self, span: Span) -> Instrumented<Self>

Instruments this type with the provided Span, returning an Instrumented wrapper. Read more
Source§

fn in_current_span(self) -> Instrumented<Self>

Instruments this type with the current Span, returning an Instrumented wrapper. Read more
Source§

impl<T, U> Into<U> for T
where U: From<T>,

Source§

fn into(self) -> U

Calls U::from(self).

That is, this conversion is whatever the implementation of From<T> for U chooses to do.

Source§

impl<T> IntoEither for T

Source§

fn into_either(self, into_left: bool) -> Either<Self, Self>

Converts self into a Left variant of Either<Self, Self> if into_left is true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
where F: FnOnce(&Self) -> bool,

Converts self into a Left variant of Either<Self, Self> if into_left(&self) returns true. Converts self into a Right variant of Either<Self, Self> otherwise. Read more
Source§

impl<T> Pipe for T
where T: ?Sized,

Source§

fn pipe<R>(self, func: impl FnOnce(Self) -> R) -> R
where Self: Sized,

Pipes by value. This is generally the method you want to use. Read more
Source§

fn pipe_ref<'a, R>(&'a self, func: impl FnOnce(&'a Self) -> R) -> R
where R: 'a,

Borrows self and passes that borrow into the pipe function. Read more
Source§

fn pipe_ref_mut<'a, R>(&'a mut self, func: impl FnOnce(&'a mut Self) -> R) -> R
where R: 'a,

Mutably borrows self and passes that borrow into the pipe function. Read more
Source§

fn pipe_borrow<'a, B, R>(&'a self, func: impl FnOnce(&'a B) -> R) -> R
where Self: Borrow<B>, B: 'a + ?Sized, R: 'a,

Borrows self, then passes self.borrow() into the pipe function. Read more
Source§

fn pipe_borrow_mut<'a, B, R>( &'a mut self, func: impl FnOnce(&'a mut B) -> R, ) -> R
where Self: BorrowMut<B>, B: 'a + ?Sized, R: 'a,

Mutably borrows self, then passes self.borrow_mut() into the pipe function. Read more
Source§

fn pipe_as_ref<'a, U, R>(&'a self, func: impl FnOnce(&'a U) -> R) -> R
where Self: AsRef<U>, U: 'a + ?Sized, R: 'a,

Borrows self, then passes self.as_ref() into the pipe function.
Source§

fn pipe_as_mut<'a, U, R>(&'a mut self, func: impl FnOnce(&'a mut U) -> R) -> R
where Self: AsMut<U>, U: 'a + ?Sized, R: 'a,

Mutably borrows self, then passes self.as_mut() into the pipe function.
Source§

fn pipe_deref<'a, T, R>(&'a self, func: impl FnOnce(&'a T) -> R) -> R
where Self: Deref<Target = T>, T: 'a + ?Sized, R: 'a,

Borrows self, then passes self.deref() into the pipe function.
Source§

fn pipe_deref_mut<'a, T, R>( &'a mut self, func: impl FnOnce(&'a mut T) -> R, ) -> R
where Self: DerefMut<Target = T> + Deref, T: 'a + ?Sized, R: 'a,

Mutably borrows self, then passes self.deref_mut() into the pipe function.
Source§

impl<T> Pointable for T

Source§

const ALIGN: usize

The alignment of pointer.
Source§

type Init = T

The type for initializers.
Source§

unsafe fn init(init: <T as Pointable>::Init) -> usize

Initializes an object with the given initializer. Read more
Source§

unsafe fn deref<'a>(ptr: usize) -> &'a T

Dereferences the given pointer. Read more
Source§

unsafe fn deref_mut<'a>(ptr: usize) -> &'a mut T

Mutably dereferences the given pointer. Read more
Source§

unsafe fn drop(ptr: usize)

Drops the object pointed to by the given pointer. Read more
Source§

impl<T> Tap for T

Source§

fn tap(self, func: impl FnOnce(&Self)) -> Self

Immutable access to a value. Read more
Source§

fn tap_mut(self, func: impl FnOnce(&mut Self)) -> Self

Mutable access to a value. Read more
Source§

fn tap_borrow<B>(self, func: impl FnOnce(&B)) -> Self
where Self: Borrow<B>, B: ?Sized,

Immutable access to the Borrow<B> of a value. Read more
Source§

fn tap_borrow_mut<B>(self, func: impl FnOnce(&mut B)) -> Self
where Self: BorrowMut<B>, B: ?Sized,

Mutable access to the BorrowMut<B> of a value. Read more
Source§

fn tap_ref<R>(self, func: impl FnOnce(&R)) -> Self
where Self: AsRef<R>, R: ?Sized,

Immutable access to the AsRef<R> view of a value. Read more
Source§

fn tap_ref_mut<R>(self, func: impl FnOnce(&mut R)) -> Self
where Self: AsMut<R>, R: ?Sized,

Mutable access to the AsMut<R> view of a value. Read more
Source§

fn tap_deref<T>(self, func: impl FnOnce(&T)) -> Self
where Self: Deref<Target = T>, T: ?Sized,

Immutable access to the Deref::Target of a value. Read more
Source§

fn tap_deref_mut<T>(self, func: impl FnOnce(&mut T)) -> Self
where Self: DerefMut<Target = T> + Deref, T: ?Sized,

Mutable access to the Deref::Target of a value. Read more
Source§

fn tap_dbg(self, func: impl FnOnce(&Self)) -> Self

Calls .tap() only in debug builds, and is erased in release builds.
Source§

fn tap_mut_dbg(self, func: impl FnOnce(&mut Self)) -> Self

Calls .tap_mut() only in debug builds, and is erased in release builds.
Source§

fn tap_borrow_dbg<B>(self, func: impl FnOnce(&B)) -> Self
where Self: Borrow<B>, B: ?Sized,

Calls .tap_borrow() only in debug builds, and is erased in release builds.
Source§

fn tap_borrow_mut_dbg<B>(self, func: impl FnOnce(&mut B)) -> Self
where Self: BorrowMut<B>, B: ?Sized,

Calls .tap_borrow_mut() only in debug builds, and is erased in release builds.
Source§

fn tap_ref_dbg<R>(self, func: impl FnOnce(&R)) -> Self
where Self: AsRef<R>, R: ?Sized,

Calls .tap_ref() only in debug builds, and is erased in release builds.
Source§

fn tap_ref_mut_dbg<R>(self, func: impl FnOnce(&mut R)) -> Self
where Self: AsMut<R>, R: ?Sized,

Calls .tap_ref_mut() only in debug builds, and is erased in release builds.
Source§

fn tap_deref_dbg<T>(self, func: impl FnOnce(&T)) -> Self
where Self: Deref<Target = T>, T: ?Sized,

Calls .tap_deref() only in debug builds, and is erased in release builds.
Source§

fn tap_deref_mut_dbg<T>(self, func: impl FnOnce(&mut T)) -> Self
where Self: DerefMut<Target = T> + Deref, T: ?Sized,

Calls .tap_deref_mut() only in debug builds, and is erased in release builds.
Source§

impl<T> TryConv for T

Source§

fn try_conv<T>(self) -> Result<T, Self::Error>
where Self: TryInto<T>,

Attempts to convert self into T using TryInto<T>. Read more
Source§

impl<T, U> TryFrom<U> for T
where U: Into<T>,

Source§

type Error = Infallible

The type returned in the event of a conversion error.
Source§

fn try_from(value: U) -> Result<T, <T as TryFrom<U>>::Error>

Performs the conversion.
Source§

impl<T, U> TryInto<U> for T
where U: TryFrom<T>,

Source§

type Error = <U as TryFrom<T>>::Error

The type returned in the event of a conversion error.
Source§

fn try_into(self) -> Result<U, <U as TryFrom<T>>::Error>

Performs the conversion.
Source§

impl<T> Upcast<T> for T

Source§

fn upcast(&self) -> Option<&T>

Source§

impl<V, T> VZip<V> for T
where V: MultiLane<T>,

Source§

fn vzip(self) -> V

Source§

impl<T> WithSubscriber for T

Source§

fn with_subscriber<S>(self, subscriber: S) -> WithDispatch<Self>
where S: Into<Dispatch>,

Attaches the provided Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

fn with_current_subscriber(self) -> WithDispatch<Self>

Attaches the current default Subscriber to this type, returning a WithDispatch wrapper. Read more
Source§

impl<T> Allocation for T
where T: RefUnwindSafe + Send + Sync,

Source§

impl<T> WasmNotSend for T
where T: Send,

Source§

impl<T> WasmNotSendSync for T

Source§

impl<T> WasmNotSync for T
where T: Sync,