pub fn warp_broadcast(lanes: &[f64], leader: usize) -> Vec<f64>
Simulate a warp-level broadcast: every lane receives the leader's value, lanes[leader].
lanes[leader]