pub fn launch_ref<R: Runtime, F: Float + CubeElement>(
client: &ComputeClient<R::Server>,
input: &TensorHandleRef<'_, R>,
output: &TensorHandleRef<'_, R>,
scale: &TensorHandleRef<'_, R>,
out_scale: &TensorHandleRef<'_, R>,
scheme: &QuantScheme,
)