pub struct ExecutionGraph { /* private fields */ }Expand description
Execution path graph for tracking brick → kernel → PTX relationships.
PAR-201: Captures the full execution hierarchy for profiling analysis.
§Example
use trueno::brick::{ExecutionGraph, ExecutionNode, EdgeType};
let mut graph = ExecutionGraph::new();
// Add layer scope
let layer_id = graph.add_node(ExecutionNode::Layer { index: 0 });
// Add brick within layer
let brick_id = graph.add_node(ExecutionNode::Brick {
id: BrickId::QkvProjection,
timing_ns: 1000,
elements: 4096,
});
graph.add_edge(layer_id, brick_id, EdgeType::Contains);
// Add kernel launched by brick
let kernel_id = graph.add_node(ExecutionNode::Kernel {
name: "batched_q4k_gemv".into(),
ptx_hash: 0x7a3b1c2d,
grid: (32, 1, 1),
block: (256, 1, 1),
shared_mem: 4096,
});
graph.add_edge(brick_id, kernel_id, EdgeType::Launches);
// Export to trueno-graph for analysis
#[cfg(feature = "execution-graph")]
let csr = graph.to_csr();Implementations§
Source§impl ExecutionGraph
impl ExecutionGraph
Sourcepub fn critical_path(&self) -> (Vec<ExecutionNodeId>, u64)
pub fn critical_path(&self) -> (Vec<ExecutionNodeId>, u64)
Compute critical path through execution graph using longest-path algorithm.
Returns (critical_path_nodes, total_time_ns). The critical path represents the longest chain of dependencies that determines total execution time.
Reference: Graham et al. (1979) “Scheduling Algorithms for Multi-Processor Systems”
Sourcepub fn compute_slack(&self) -> HashMap<ExecutionNodeId, u64>
pub fn compute_slack(&self) -> HashMap<ExecutionNodeId, u64>
Compute slack for each node (how much it can be delayed without affecting total time).
Returns map from node ID to slack in nanoseconds. Nodes on critical path have slack = 0.
Sourcepub fn roofline_distance(
&self,
peak_tflops: f32,
peak_bandwidth_gb_s: f32,
) -> HashMap<ExecutionNodeId, f32>
pub fn roofline_distance( &self, peak_tflops: f32, peak_bandwidth_gb_s: f32, ) -> HashMap<ExecutionNodeId, f32>
Compute roofline distance for kernel nodes.
Returns map from kernel node ID to distance from roofline (0.0 = optimal). Distance = 1.0 - min(achieved/peak_compute, achieved/peak_bandwidth).
Reference: Williams et al. (2009) “Roofline: An Insightful Visual Performance Model”
Sourcepub fn detect_ping_pong(&self) -> Vec<(ExecutionNodeId, ExecutionNodeId)>
pub fn detect_ping_pong(&self) -> Vec<(ExecutionNodeId, ExecutionNodeId)>
Detect ping-pong memory transfer patterns (wasteful H2D followed by D2H).
Returns pairs of transfer node IDs that exhibit ping-pong behavior.
Sourcepub fn critical_path_summary(&self) -> String
pub fn critical_path_summary(&self) -> String
Get critical path analysis summary as formatted string.
Source§impl ExecutionGraph
impl ExecutionGraph
Sourcepub fn add_node(&mut self, node: ExecutionNode) -> ExecutionNodeId
pub fn add_node(&mut self, node: ExecutionNode) -> ExecutionNodeId
Add a node to the graph, returning its ID.
Sourcepub fn add_edge(
&mut self,
src: ExecutionNodeId,
dst: ExecutionNodeId,
edge_type: EdgeType,
)
pub fn add_edge( &mut self, src: ExecutionNodeId, dst: ExecutionNodeId, edge_type: EdgeType, )
Add an edge between two nodes.
Sourcepub fn add_weighted_edge(
&mut self,
src: ExecutionNodeId,
dst: ExecutionNodeId,
edge_type: EdgeType,
weight: f32,
)
pub fn add_weighted_edge( &mut self, src: ExecutionNodeId, dst: ExecutionNodeId, edge_type: EdgeType, weight: f32, )
Add an edge with a weight.
Sourcepub fn push_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId
pub fn push_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId
Push a scope for hierarchical recording. All subsequent nodes will be children of this scope.
Sourcepub fn pop_scope(&mut self) -> Option<ExecutionNodeId>
pub fn pop_scope(&mut self) -> Option<ExecutionNodeId>
Pop the current scope.
Sourcepub fn current_scope(&self) -> Option<ExecutionNodeId>
pub fn current_scope(&self) -> Option<ExecutionNodeId>
Get the current scope (if any).
Sourcepub fn add_node_in_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId
pub fn add_node_in_scope(&mut self, node: ExecutionNode) -> ExecutionNodeId
Add a node under the current scope.
Sourcepub fn record_kernel_launch(
&mut self,
name: &str,
ptx_hash: u64,
grid: (u32, u32, u32),
block: (u32, u32, u32),
shared_mem: u32,
) -> ExecutionNodeId
pub fn record_kernel_launch( &mut self, name: &str, ptx_hash: u64, grid: (u32, u32, u32), block: (u32, u32, u32), shared_mem: u32, ) -> ExecutionNodeId
Record a kernel launch under the current scope.
Sourcepub fn record_kernel_launch_with_metrics(
&mut self,
name: &str,
ptx_hash: u64,
grid: (u32, u32, u32),
block: (u32, u32, u32),
shared_mem: u32,
timing_ns: u64,
arithmetic_intensity: f32,
achieved_tflops: f32,
) -> ExecutionNodeId
pub fn record_kernel_launch_with_metrics( &mut self, name: &str, ptx_hash: u64, grid: (u32, u32, u32), block: (u32, u32, u32), shared_mem: u32, timing_ns: u64, arithmetic_intensity: f32, achieved_tflops: f32, ) -> ExecutionNodeId
Record a kernel launch with roofline metrics (Phase 9).
Sourcepub fn record_transfer(
&mut self,
src: &str,
dst: &str,
bytes: u64,
direction: TransferDirection,
timing_ns: Option<u64>,
) -> ExecutionNodeId
pub fn record_transfer( &mut self, src: &str, dst: &str, bytes: u64, direction: TransferDirection, timing_ns: Option<u64>, ) -> ExecutionNodeId
Record a memory transfer (Phase 9: data movement topology).
Sourcepub fn add_dependency(&mut self, from: ExecutionNodeId, to: ExecutionNodeId)
pub fn add_dependency(&mut self, from: ExecutionNodeId, to: ExecutionNodeId)
Add a dependency edge for critical path analysis (Phase 9).
Sourcepub fn node(&self, id: ExecutionNodeId) -> Option<&ExecutionNode>
pub fn node(&self, id: ExecutionNodeId) -> Option<&ExecutionNode>
Get a node by ID.
Sourcepub fn node_by_name(
&self,
name: &str,
) -> Option<(ExecutionNodeId, &ExecutionNode)>
pub fn node_by_name( &self, name: &str, ) -> Option<(ExecutionNodeId, &ExecutionNode)>
Get a node by name.
Sourcepub fn nodes(&self) -> &[ExecutionNode]
pub fn nodes(&self) -> &[ExecutionNode]
Get all nodes.
Sourcepub fn edges(&self) -> &[ExecutionEdge]
pub fn edges(&self) -> &[ExecutionEdge]
Get all edges.
Sourcepub fn outgoing_edges(
&self,
node: ExecutionNodeId,
) -> impl Iterator<Item = &ExecutionEdge>
pub fn outgoing_edges( &self, node: ExecutionNodeId, ) -> impl Iterator<Item = &ExecutionEdge>
Get outgoing edges for a node.
Sourcepub fn incoming_edges(
&self,
node: ExecutionNodeId,
) -> impl Iterator<Item = &ExecutionEdge>
pub fn incoming_edges( &self, node: ExecutionNodeId, ) -> impl Iterator<Item = &ExecutionEdge>
Get incoming edges for a node.
Sourcepub fn kernel_nodes(
&self,
) -> impl Iterator<Item = (ExecutionNodeId, &ExecutionNode)>
pub fn kernel_nodes( &self, ) -> impl Iterator<Item = (ExecutionNodeId, &ExecutionNode)>
Find all kernel nodes.
Sourcepub fn slowest_kernel(&self) -> Option<(ExecutionNodeId, &ExecutionNode, u64)>
pub fn slowest_kernel(&self) -> Option<(ExecutionNodeId, &ExecutionNode, u64)>
Find the slowest kernel (by parent brick timing).
Sourcepub fn is_scope_balanced(&self) -> bool
pub fn is_scope_balanced(&self) -> bool
Check if scope stack is balanced (empty).
Source§impl ExecutionGraph
impl ExecutionGraph
Sourcepub fn to_tree_node(&self) -> TreeNode
pub fn to_tree_node(&self) -> TreeNode
Convert to presentar-terminal TreeNode for TUI visualization.
PAR-201: Renders the execution graph as a collapsible tree in the terminal.
Sourcepub fn to_ascii_tree(&self) -> String
pub fn to_ascii_tree(&self) -> String
Render graph to ASCII tree string (headless mode for testing/automation).
PAR-201: Zero-dependency tree visualization for CI/CD, logging, and snapshot tests.
Trait Implementations§
Source§impl Debug for ExecutionGraph
impl Debug for ExecutionGraph
Source§impl Default for ExecutionGraph
impl Default for ExecutionGraph
Source§fn default() -> ExecutionGraph
fn default() -> ExecutionGraph
Auto Trait Implementations§
impl Freeze for ExecutionGraph
impl RefUnwindSafe for ExecutionGraph
impl Send for ExecutionGraph
impl Sync for ExecutionGraph
impl Unpin for ExecutionGraph
impl UnsafeUnpin for ExecutionGraph
impl UnwindSafe for ExecutionGraph
Blanket Implementations§
Source§impl<T> BorrowMut<T> for Twhere
T: ?Sized,
impl<T> BorrowMut<T> for Twhere
T: ?Sized,
Source§fn borrow_mut(&mut self) -> &mut T
fn borrow_mut(&mut self) -> &mut T
Source§impl<T> FmtForward for T
impl<T> FmtForward for T
Source§fn fmt_binary(self) -> FmtBinary<Self>where
Self: Binary,
fn fmt_binary(self) -> FmtBinary<Self>where
Self: Binary,
self to use its Binary implementation when Debug-formatted.Source§fn fmt_display(self) -> FmtDisplay<Self>where
Self: Display,
fn fmt_display(self) -> FmtDisplay<Self>where
Self: Display,
self to use its Display implementation when
Debug-formatted.Source§fn fmt_lower_exp(self) -> FmtLowerExp<Self>where
Self: LowerExp,
fn fmt_lower_exp(self) -> FmtLowerExp<Self>where
Self: LowerExp,
self to use its LowerExp implementation when
Debug-formatted.Source§fn fmt_lower_hex(self) -> FmtLowerHex<Self>where
Self: LowerHex,
fn fmt_lower_hex(self) -> FmtLowerHex<Self>where
Self: LowerHex,
self to use its LowerHex implementation when
Debug-formatted.Source§fn fmt_octal(self) -> FmtOctal<Self>where
Self: Octal,
fn fmt_octal(self) -> FmtOctal<Self>where
Self: Octal,
self to use its Octal implementation when Debug-formatted.Source§fn fmt_pointer(self) -> FmtPointer<Self>where
Self: Pointer,
fn fmt_pointer(self) -> FmtPointer<Self>where
Self: Pointer,
self to use its Pointer implementation when
Debug-formatted.Source§fn fmt_upper_exp(self) -> FmtUpperExp<Self>where
Self: UpperExp,
fn fmt_upper_exp(self) -> FmtUpperExp<Self>where
Self: UpperExp,
self to use its UpperExp implementation when
Debug-formatted.Source§fn fmt_upper_hex(self) -> FmtUpperHex<Self>where
Self: UpperHex,
fn fmt_upper_hex(self) -> FmtUpperHex<Self>where
Self: UpperHex,
self to use its UpperHex implementation when
Debug-formatted.Source§impl<T> Instrument for T
impl<T> Instrument for T
Source§fn instrument(self, span: Span) -> Instrumented<Self>
fn instrument(self, span: Span) -> Instrumented<Self>
Source§fn in_current_span(self) -> Instrumented<Self>
fn in_current_span(self) -> Instrumented<Self>
Source§impl<T> IntoEither for T
impl<T> IntoEither for T
Source§fn into_either(self, into_left: bool) -> Either<Self, Self>
fn into_either(self, into_left: bool) -> Either<Self, Self>
self into a Left variant of Either<Self, Self>
if into_left is true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read moreSource§fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
fn into_either_with<F>(self, into_left: F) -> Either<Self, Self>
self into a Left variant of Either<Self, Self>
if into_left(&self) returns true.
Converts self into a Right variant of Either<Self, Self>
otherwise. Read moreSource§impl<T> Pipe for Twhere
T: ?Sized,
impl<T> Pipe for Twhere
T: ?Sized,
Source§fn pipe<R>(self, func: impl FnOnce(Self) -> R) -> Rwhere
Self: Sized,
fn pipe<R>(self, func: impl FnOnce(Self) -> R) -> Rwhere
Self: Sized,
Source§fn pipe_ref<'a, R>(&'a self, func: impl FnOnce(&'a Self) -> R) -> Rwhere
R: 'a,
fn pipe_ref<'a, R>(&'a self, func: impl FnOnce(&'a Self) -> R) -> Rwhere
R: 'a,
self and passes that borrow into the pipe function. Read moreSource§fn pipe_ref_mut<'a, R>(&'a mut self, func: impl FnOnce(&'a mut Self) -> R) -> Rwhere
R: 'a,
fn pipe_ref_mut<'a, R>(&'a mut self, func: impl FnOnce(&'a mut Self) -> R) -> Rwhere
R: 'a,
self and passes that borrow into the pipe function. Read moreSource§fn pipe_borrow<'a, B, R>(&'a self, func: impl FnOnce(&'a B) -> R) -> R
fn pipe_borrow<'a, B, R>(&'a self, func: impl FnOnce(&'a B) -> R) -> R
Source§fn pipe_borrow_mut<'a, B, R>(
&'a mut self,
func: impl FnOnce(&'a mut B) -> R,
) -> R
fn pipe_borrow_mut<'a, B, R>( &'a mut self, func: impl FnOnce(&'a mut B) -> R, ) -> R
Source§fn pipe_as_ref<'a, U, R>(&'a self, func: impl FnOnce(&'a U) -> R) -> R
fn pipe_as_ref<'a, U, R>(&'a self, func: impl FnOnce(&'a U) -> R) -> R
self, then passes self.as_ref() into the pipe function.Source§fn pipe_as_mut<'a, U, R>(&'a mut self, func: impl FnOnce(&'a mut U) -> R) -> R
fn pipe_as_mut<'a, U, R>(&'a mut self, func: impl FnOnce(&'a mut U) -> R) -> R
self, then passes self.as_mut() into the pipe
function.Source§fn pipe_deref<'a, T, R>(&'a self, func: impl FnOnce(&'a T) -> R) -> R
fn pipe_deref<'a, T, R>(&'a self, func: impl FnOnce(&'a T) -> R) -> R
self, then passes self.deref() into the pipe function.Source§impl<T> Pointable for T
impl<T> Pointable for T
Source§impl<T> Tap for T
impl<T> Tap for T
Source§fn tap_borrow<B>(self, func: impl FnOnce(&B)) -> Self
fn tap_borrow<B>(self, func: impl FnOnce(&B)) -> Self
Borrow<B> of a value. Read moreSource§fn tap_borrow_mut<B>(self, func: impl FnOnce(&mut B)) -> Self
fn tap_borrow_mut<B>(self, func: impl FnOnce(&mut B)) -> Self
BorrowMut<B> of a value. Read moreSource§fn tap_ref<R>(self, func: impl FnOnce(&R)) -> Self
fn tap_ref<R>(self, func: impl FnOnce(&R)) -> Self
AsRef<R> view of a value. Read moreSource§fn tap_ref_mut<R>(self, func: impl FnOnce(&mut R)) -> Self
fn tap_ref_mut<R>(self, func: impl FnOnce(&mut R)) -> Self
AsMut<R> view of a value. Read moreSource§fn tap_deref<T>(self, func: impl FnOnce(&T)) -> Self
fn tap_deref<T>(self, func: impl FnOnce(&T)) -> Self
Deref::Target of a value. Read moreSource§fn tap_deref_mut<T>(self, func: impl FnOnce(&mut T)) -> Self
fn tap_deref_mut<T>(self, func: impl FnOnce(&mut T)) -> Self
Deref::Target of a value. Read moreSource§fn tap_dbg(self, func: impl FnOnce(&Self)) -> Self
fn tap_dbg(self, func: impl FnOnce(&Self)) -> Self
.tap() only in debug builds, and is erased in release builds.Source§fn tap_mut_dbg(self, func: impl FnOnce(&mut Self)) -> Self
fn tap_mut_dbg(self, func: impl FnOnce(&mut Self)) -> Self
.tap_mut() only in debug builds, and is erased in release
builds.Source§fn tap_borrow_dbg<B>(self, func: impl FnOnce(&B)) -> Self
fn tap_borrow_dbg<B>(self, func: impl FnOnce(&B)) -> Self
.tap_borrow() only in debug builds, and is erased in release
builds.Source§fn tap_borrow_mut_dbg<B>(self, func: impl FnOnce(&mut B)) -> Self
fn tap_borrow_mut_dbg<B>(self, func: impl FnOnce(&mut B)) -> Self
.tap_borrow_mut() only in debug builds, and is erased in release
builds.Source§fn tap_ref_dbg<R>(self, func: impl FnOnce(&R)) -> Self
fn tap_ref_dbg<R>(self, func: impl FnOnce(&R)) -> Self
.tap_ref() only in debug builds, and is erased in release
builds.Source§fn tap_ref_mut_dbg<R>(self, func: impl FnOnce(&mut R)) -> Self
fn tap_ref_mut_dbg<R>(self, func: impl FnOnce(&mut R)) -> Self
.tap_ref_mut() only in debug builds, and is erased in release
builds.Source§fn tap_deref_dbg<T>(self, func: impl FnOnce(&T)) -> Self
fn tap_deref_dbg<T>(self, func: impl FnOnce(&T)) -> Self
.tap_deref() only in debug builds, and is erased in release
builds.