pub fn sigmoid_slice_dispatch(input: &[f32], output: &mut [f32])
Applies a fast sigmoid element-wise, reading from `input` and writing to `output`: output[i] = 1 / (1 + exp(-input[i])).
output[i] = 1 / (1 + exp(-input[i]))