#[cfg(target_arch = "x86_64")]
#[inline(always)]
pub fn addcarry_u64(x: u64, y: u64, c: u8) -> (u64, u8) {
use core::arch::x86_64::_addcarry_u64;
let mut d = 0u64;
let cc = _addcarry_u64(c, x, y, &mut d);
(d, cc)
}
#[cfg(not(target_arch = "x86_64"))]
#[inline(always)]
pub const fn addcarry_u64(x: u64, y: u64, c: u8) -> (u64, u8) {
let z = (x as u128).wrapping_add(y as u128).wrapping_add(c as u128);
(z as u64, (z >> 64) as u8)
}
#[cfg(target_arch = "x86_64")]
#[inline(always)]
pub fn subborrow_u64(x: u64, y: u64, c: u8) -> (u64, u8) {
use core::arch::x86_64::_subborrow_u64;
let mut d = 0u64;
let cc = _subborrow_u64(c, x, y, &mut d);
(d, cc)
}
#[cfg(not(target_arch = "x86_64"))]
#[inline(always)]
pub const fn subborrow_u64(x: u64, y: u64, c: u8) -> (u64, u8) {
let z = (x as u128).wrapping_sub(y as u128).wrapping_sub(c as u128);
(z as u64, (z >> 127) as u8)
}
#[cfg(target_arch = "x86_64")]
#[inline(always)]
pub fn umull(x: u64, y: u64) -> (u64, u64) {
use core::arch::x86_64::_mulx_u64;
unsafe {
let mut hi: u64 = 0u64;
let low = _mulx_u64(x, y, &mut hi);
(low, hi)
}
}
#[cfg(not(target_arch = "x86_64"))]
#[inline(always)]
pub const fn umull(x: u64, y: u64) -> (u64, u64) {
let z = (x as u128) * (y as u128);
(z as u64, (z >> 64) as u64)
}
#[inline(always)]
pub const fn umull_add(x: u64, y: u64, z: u64) -> (u64, u64) {
let t = ((x as u128) * (y as u128)).wrapping_add(z as u128);
(t as u64, (t >> 64) as u64)
}
#[inline(always)]
pub const fn umull_add2(x: u64, y: u64, z1: u64, z2: u64) -> (u64, u64) {
let t = ((x as u128) * (y as u128))
.wrapping_add(z1 as u128)
.wrapping_add(z2 as u128);
(t as u64, (t >> 64) as u64)
}
#[inline(always)]
pub const fn umull_x2(x1: u64, y1: u64, x2: u64, y2: u64) -> (u64, u64) {
let z1 = (x1 as u128) * (y1 as u128);
let z2 = (x2 as u128) * (y2 as u128);
let z = z1.wrapping_add(z2);
(z as u64, (z >> 64) as u64)
}
#[inline(always)]
pub const fn umull_x2_add(x1: u64, y1: u64, x2: u64, y2: u64, z3: u64) -> (u64, u64) {
let z1 = (x1 as u128) * (y1 as u128);
let z2 = (x2 as u128) * (y2 as u128);
let z = z1.wrapping_add(z2).wrapping_add(z3 as u128);
(z as u64, (z >> 64) as u64)
}
#[inline(always)]
pub const fn sgnw(x: u64) -> u64 {
((x as i64) >> 63) as u64
}
#[cfg(any(
all(target_arch = "x86_64", target_feature = "lzcnt"),
target_arch = "aarch64",
))]
#[inline(always)]
pub const fn lzcnt(x: u64) -> u32 {
x.leading_zeros()
}
#[cfg(not(any(
all(target_arch = "x86_64", target_feature = "lzcnt"),
target_arch = "aarch64",
)))]
pub const fn lzcnt(x: u64) -> u32 {
let m = sgnw((x >> 32).wrapping_sub(1));
let s = m & 32;
let x = (x >> 32) ^ (m & (x ^ (x >> 32)));
let m = sgnw((x >> 16).wrapping_sub(1));
let s = s | (m & 16);
let x = (x >> 16) ^ (m & (x ^ (x >> 16)));
let m = sgnw((x >> 8).wrapping_sub(1));
let s = s | (m & 8);
let x = (x >> 8) ^ (m & (x ^ (x >> 8)));
let m = sgnw((x >> 4).wrapping_sub(1));
let s = s | (m & 4);
let x = (x >> 4) ^ (m & (x ^ (x >> 4)));
let m = sgnw((x >> 2).wrapping_sub(1));
let s = s | (m & 2);
let x = (x >> 2) ^ (m & (x ^ (x >> 2)));
let s = s.wrapping_add(2u64.wrapping_sub(x) & (x.wrapping_sub(3) >> 2));
s as u32
}