pub fn simd_squared_distances(x1: &Array2<f64>, x2: &Array2<f64>) -> Array2<f64>
SIMD-accelerated computation of the matrix of squared distances between `x1` and `x2`.