pub fn dequantize_simd(input: &[i8], output: &mut [f32], params: &QuantParams)
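SIMD-dispatched dequantization: converts the quantized `i8` values in `input` to `f32` values written into `output`, using the quantization parameters in `params`.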