pub fn gpu_axpy(a: f64, x: &[f64], y: &mut Vec<f64>)
In-place AXPY: y ← a·x + y.
Panics if x.len() != y.len().
Panic condition: `x.len() != y.len()` (`x` and `y` must have the same length).