pub fn dispatch_optimal_size(len: u32, subgroup_size: u32) -> u32