pub fn quantize_f16(checkpoint: &mut HashMap<String, Tensor>) -> Result<()>
Quantize the float tensors in `checkpoint` to f16.