include!("macros.rs");
#[cfg(not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")))]
#[path = "../fallback/outline_atomics.rs"]
mod fallback;
#[cfg(not(portable_atomic_no_outline_atomics))]
#[cfg(not(target_env = "sgx"))]
#[path = "detect/x86_64.rs"]
mod detect;
#[cfg(not(portable_atomic_no_asm))]
use core::arch::asm;
use core::sync::atomic::Ordering;
use crate::utils::{Pair, U128};
macro_rules! debug_assert_cmpxchg16b {
() => {
#[cfg(not(any(
target_feature = "cmpxchg16b",
portable_atomic_target_feature = "cmpxchg16b",
)))]
{
debug_assert!(detect::detect().has_cmpxchg16b());
}
};
}
#[cfg(not(any(portable_atomic_no_outline_atomics, target_env = "sgx")))]
#[cfg(target_feature = "sse")]
macro_rules! debug_assert_vmovdqa_atomic {
() => {{
debug_assert_cmpxchg16b!();
debug_assert!(detect::detect().has_vmovdqa_atomic());
}};
}
#[allow(unused_macros)]
#[cfg(target_pointer_width = "32")]
macro_rules! ptr_modifier {
() => {
":e"
};
}
#[allow(unused_macros)]
#[cfg(target_pointer_width = "64")]
macro_rules! ptr_modifier {
() => {
""
};
}
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
#[inline]
unsafe fn cmpxchg16b(dst: *mut u128, old: u128, new: u128) -> (u128, bool) {
debug_assert!(dst as usize % 16 == 0);
debug_assert_cmpxchg16b!();
unsafe {
let r: u8;
let old = U128 { whole: old };
let new = U128 { whole: new };
let (prev_lo, prev_hi);
macro_rules! cmpxchg16b {
($rdi:tt) => {
asm!(
"xchg {rbx_tmp}, rbx",
concat!("lock cmpxchg16b xmmword ptr [", $rdi, "]"),
"sete r8b",
"mov rbx, {rbx_tmp}", rbx_tmp = inout(reg) new.pair.lo => _,
in("rcx") new.pair.hi,
inout("rax") old.pair.lo => prev_lo,
inout("rdx") old.pair.hi => prev_hi,
in($rdi) dst,
out("r8b") r,
options(nostack),
)
};
}
#[cfg(target_pointer_width = "32")]
cmpxchg16b!("edi");
#[cfg(target_pointer_width = "64")]
cmpxchg16b!("rdi");
(U128 { pair: Pair { lo: prev_lo, hi: prev_hi } }.whole, r != 0)
}
}
#[cfg(not(any(portable_atomic_no_outline_atomics, target_env = "sgx")))]
#[cfg(target_feature = "sse")]
#[target_feature(enable = "avx")]
#[inline]
unsafe fn atomic_load_vmovdqa(src: *mut u128) -> u128 {
debug_assert!(src as usize % 16 == 0);
debug_assert_vmovdqa_atomic!();
unsafe {
let out: core::arch::x86_64::__m128;
asm!(
concat!("vmovdqa {out}, xmmword ptr [{src", ptr_modifier!(), "}]"),
src = in(reg) src,
out = out(xmm_reg) out,
options(nostack, preserves_flags),
);
core::mem::transmute(out)
}
}
#[cfg(not(any(portable_atomic_no_outline_atomics, target_env = "sgx")))]
#[cfg(target_feature = "sse")]
#[target_feature(enable = "avx")]
#[inline]
unsafe fn atomic_store_vmovdqa(dst: *mut u128, val: u128, order: Ordering) {
debug_assert!(dst as usize % 16 == 0);
debug_assert_vmovdqa_atomic!();
unsafe {
let val: core::arch::x86_64::__m128 = core::mem::transmute(val);
match order {
Ordering::Relaxed | Ordering::Release => {
asm!(
concat!("vmovdqa xmmword ptr [{dst", ptr_modifier!(), "}], {val}"),
dst = in(reg) dst,
val = in(xmm_reg) val,
options(nostack, preserves_flags),
);
}
Ordering::SeqCst => {
asm!(
concat!("vmovdqa xmmword ptr [{dst", ptr_modifier!(), "}], {val}"),
"mfence",
dst = in(reg) dst,
val = in(xmm_reg) val,
options(nostack, preserves_flags),
);
}
_ => unreachable!("{:?}", order),
}
}
}
#[cfg(not(all(
any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"),
any(portable_atomic_no_outline_atomics, target_env = "sgx", not(target_feature = "sse")),
)))]
macro_rules! load_store_detect {
(
vmovdqa = $vmovdqa:ident
cmpxchg16b = $cmpxchg16b:ident
fallback = $fallback:ident
) => {{
let cpuid = detect::detect();
#[cfg(not(any(
target_feature = "cmpxchg16b",
portable_atomic_target_feature = "cmpxchg16b",
)))]
{
if cpuid.has_cmpxchg16b() {
#[cfg(target_feature = "sse")]
{
if cpuid.has_vmovdqa_atomic() {
$vmovdqa
} else {
$cmpxchg16b
}
}
#[cfg(not(target_feature = "sse"))]
{
$cmpxchg16b
}
} else {
fallback::$fallback
}
}
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
{
if cpuid.has_vmovdqa_atomic() {
$vmovdqa
} else {
$cmpxchg16b
}
}
}};
}
#[inline]
unsafe fn atomic_load(src: *mut u128, _order: Ordering) -> u128 {
#[cfg(all(
any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"),
any(portable_atomic_no_outline_atomics, target_env = "sgx", not(target_feature = "sse")),
))]
unsafe {
atomic_load_cmpxchg16b(src)
}
#[cfg(not(all(
any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"),
any(portable_atomic_no_outline_atomics, target_env = "sgx", not(target_feature = "sse")),
)))]
unsafe {
ifunc!(unsafe fn(src: *mut u128) -> u128 {
load_store_detect! {
vmovdqa = atomic_load_vmovdqa
cmpxchg16b = atomic_load_cmpxchg16b
fallback = atomic_load_seqcst
}
})
}
}
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
#[inline]
unsafe fn atomic_load_cmpxchg16b(src: *mut u128) -> u128 {
debug_assert!(src as usize % 16 == 0);
debug_assert_cmpxchg16b!();
unsafe {
let (out_lo, out_hi);
macro_rules! cmpxchg16b {
($rdi:tt) => {
asm!(
"mov {rbx_tmp}, rbx",
"xor rbx, rbx", concat!("lock cmpxchg16b xmmword ptr [", $rdi, "]"),
"mov rbx, {rbx_tmp}", rbx_tmp = out(reg) _,
in("rcx") 0_u64,
inout("rax") 0_u64 => out_lo,
inout("rdx") 0_u64 => out_hi,
in($rdi) src,
options(nostack),
)
};
}
#[cfg(target_pointer_width = "32")]
cmpxchg16b!("edi");
#[cfg(target_pointer_width = "64")]
cmpxchg16b!("rdi");
U128 { pair: Pair { lo: out_lo, hi: out_hi } }.whole
}
}
#[inline]
unsafe fn atomic_store(dst: *mut u128, val: u128, order: Ordering) {
#[cfg(all(
any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"),
any(portable_atomic_no_outline_atomics, target_env = "sgx", not(target_feature = "sse")),
))]
unsafe {
let _ = order;
atomic_store_cmpxchg16b(dst, val);
}
#[cfg(not(all(
any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"),
any(portable_atomic_no_outline_atomics, target_env = "sgx", not(target_feature = "sse")),
)))]
unsafe {
#[cfg(target_feature = "sse")]
fn_alias! {
#[target_feature(enable = "avx")]
unsafe fn(dst: *mut u128, val: u128);
atomic_store_vmovdqa_non_seqcst = atomic_store_vmovdqa(Ordering::Release);
atomic_store_vmovdqa_seqcst = atomic_store_vmovdqa(Ordering::SeqCst);
}
match order {
Ordering::Relaxed | Ordering::Release => {
ifunc!(unsafe fn(dst: *mut u128, val: u128) {
load_store_detect! {
vmovdqa = atomic_store_vmovdqa_non_seqcst
cmpxchg16b = atomic_store_cmpxchg16b
fallback = atomic_store_non_seqcst
}
});
}
Ordering::SeqCst => {
ifunc!(unsafe fn(dst: *mut u128, val: u128) {
load_store_detect! {
vmovdqa = atomic_store_vmovdqa_seqcst
cmpxchg16b = atomic_store_cmpxchg16b
fallback = atomic_store_seqcst
}
});
}
_ => unreachable!("{:?}", order),
}
}
}
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
unsafe fn atomic_store_cmpxchg16b(dst: *mut u128, val: u128) {
unsafe {
atomic_swap_cmpxchg16b(dst, val, Ordering::SeqCst);
}
}
#[inline]
unsafe fn atomic_compare_exchange(
dst: *mut u128,
old: u128,
new: u128,
_success: Ordering,
_failure: Ordering,
) -> Result<u128, u128> {
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
let (prev, ok) = unsafe { cmpxchg16b(dst, old, new) };
#[cfg(not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")))]
let (prev, ok) = unsafe {
ifunc!(unsafe fn(dst: *mut u128, old: u128, new: u128) -> (u128, bool) {
if detect::detect().has_cmpxchg16b() {
cmpxchg16b
} else {
fallback::atomic_compare_exchange_seqcst
}
})
};
if ok {
Ok(prev)
} else {
Err(prev)
}
}
use atomic_compare_exchange as atomic_compare_exchange_weak;
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
use atomic_swap_cmpxchg16b as atomic_swap;
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
#[inline]
unsafe fn atomic_swap_cmpxchg16b(dst: *mut u128, val: u128, _order: Ordering) -> u128 {
debug_assert!(dst as usize % 16 == 0);
debug_assert_cmpxchg16b!();
unsafe {
let val = U128 { whole: val };
let (mut prev_lo, mut prev_hi);
macro_rules! cmpxchg16b {
($rdi:tt) => {
asm!(
"xchg {rbx_tmp}, rbx",
concat!("mov rax, qword ptr [", $rdi, "]"),
concat!("mov rdx, qword ptr [", $rdi, " + 8]"),
"2:",
concat!("lock cmpxchg16b xmmword ptr [", $rdi, "]"),
"jne 2b",
"mov rbx, {rbx_tmp}", rbx_tmp = inout(reg) val.pair.lo => _,
in("rcx") val.pair.hi,
out("rax") prev_lo,
out("rdx") prev_hi,
in($rdi) dst,
options(nostack),
)
};
}
#[cfg(target_pointer_width = "32")]
cmpxchg16b!("edi");
#[cfg(target_pointer_width = "64")]
cmpxchg16b!("rdi");
U128 { pair: Pair { lo: prev_lo, hi: prev_hi } }.whole
}
}
macro_rules! atomic_rmw_cas_3 {
($name:ident as $reexport_name:ident, $($op:tt)*) => {
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
use $name as $reexport_name;
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
#[inline]
unsafe fn $name(dst: *mut u128, val: u128, _order: Ordering) -> u128 {
debug_assert!(dst as usize % 16 == 0);
debug_assert_cmpxchg16b!();
unsafe {
let val = U128 { whole: val };
let (mut prev_lo, mut prev_hi);
macro_rules! cmpxchg16b {
($rdi:tt) => {
asm!(
"mov {rbx_tmp}, rbx",
concat!("mov rax, qword ptr [", $rdi, "]"),
concat!("mov rdx, qword ptr [", $rdi, " + 8]"),
"2:",
$($op)*
concat!("lock cmpxchg16b xmmword ptr [", $rdi, "]"),
"jne 2b",
"mov rbx, {rbx_tmp}", rbx_tmp = out(reg) _,
out("rcx") _,
out("rax") prev_lo,
out("rdx") prev_hi,
in($rdi) dst,
in("rsi") val.pair.lo,
in("r8") val.pair.hi,
options(nostack),
)
};
}
#[cfg(target_pointer_width = "32")]
cmpxchg16b!("edi");
#[cfg(target_pointer_width = "64")]
cmpxchg16b!("rdi");
U128 { pair: Pair { lo: prev_lo, hi: prev_hi } }.whole
}
}
};
}
macro_rules! atomic_rmw_cas_2 {
($name:ident as $reexport_name:ident, $($op:tt)*) => {
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
use $name as $reexport_name;
#[cfg_attr(
not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")),
target_feature(enable = "cmpxchg16b")
)]
#[inline]
unsafe fn $name(dst: *mut u128, _order: Ordering) -> u128 {
debug_assert!(dst as usize % 16 == 0);
debug_assert_cmpxchg16b!();
unsafe {
let (mut prev_lo, mut prev_hi);
macro_rules! cmpxchg16b {
($rdi:tt) => {
asm!(
"mov {rbx_tmp}, rbx",
concat!("mov rax, qword ptr [", $rdi, "]"),
concat!("mov rdx, qword ptr [", $rdi, " + 8]"),
"2:",
$($op)*
concat!("lock cmpxchg16b xmmword ptr [", $rdi, "]"),
"jne 2b",
"mov rbx, {rbx_tmp}", rbx_tmp = out(reg) _,
out("rcx") _,
out("rax") prev_lo,
out("rdx") prev_hi,
in($rdi) dst,
options(nostack),
)
};
}
#[cfg(target_pointer_width = "32")]
cmpxchg16b!("edi");
#[cfg(target_pointer_width = "64")]
cmpxchg16b!("rdi");
U128 { pair: Pair { lo: prev_lo, hi: prev_hi } }.whole
}
}
};
}
atomic_rmw_cas_3! {
atomic_add_cmpxchg16b as atomic_add,
"mov rbx, rax",
"add rbx, rsi",
"mov rcx, rdx",
"adc rcx, r8",
}
atomic_rmw_cas_3! {
atomic_sub_cmpxchg16b as atomic_sub,
"mov rbx, rax",
"sub rbx, rsi",
"mov rcx, rdx",
"sbb rcx, r8",
}
atomic_rmw_cas_3! {
atomic_and_cmpxchg16b as atomic_and,
"mov rbx, rax",
"and rbx, rsi",
"mov rcx, rdx",
"and rcx, r8",
}
atomic_rmw_cas_3! {
atomic_nand_cmpxchg16b as atomic_nand,
"mov rbx, rax",
"and rbx, rsi",
"not rbx",
"mov rcx, rdx",
"and rcx, r8",
"not rcx",
}
atomic_rmw_cas_3! {
atomic_or_cmpxchg16b as atomic_or,
"mov rbx, rax",
"or rbx, rsi",
"mov rcx, rdx",
"or rcx, r8",
}
atomic_rmw_cas_3! {
atomic_xor_cmpxchg16b as atomic_xor,
"mov rbx, rax",
"xor rbx, rsi",
"mov rcx, rdx",
"xor rcx, r8",
}
atomic_rmw_cas_2! {
atomic_not_cmpxchg16b as atomic_not,
"mov rbx, rax",
"not rbx",
"mov rcx, rdx",
"not rcx",
}
atomic_rmw_cas_2! {
atomic_neg_cmpxchg16b as atomic_neg,
"mov rbx, rax",
"neg rbx",
"mov rcx, 0",
"sbb rcx, rdx",
}
atomic_rmw_cas_3! {
atomic_max_cmpxchg16b as atomic_max,
"cmp rsi, rax",
"mov rcx, r8",
"sbb rcx, rdx",
"mov rcx, r8",
"cmovl rcx, rdx",
"mov rbx, rsi",
"cmovl rbx, rax",
}
atomic_rmw_cas_3! {
atomic_umax_cmpxchg16b as atomic_umax,
"cmp rsi, rax",
"mov rcx, r8",
"sbb rcx, rdx",
"mov rcx, r8",
"cmovb rcx, rdx",
"mov rbx, rsi",
"cmovb rbx, rax",
}
atomic_rmw_cas_3! {
atomic_min_cmpxchg16b as atomic_min,
"cmp rsi, rax",
"mov rcx, r8",
"sbb rcx, rdx",
"mov rcx, r8",
"cmovge rcx, rdx",
"mov rbx, rsi",
"cmovge rbx, rax",
}
atomic_rmw_cas_3! {
atomic_umin_cmpxchg16b as atomic_umin,
"cmp rsi, rax",
"mov rcx, r8",
"sbb rcx, rdx",
"mov rcx, r8",
"cmovae rcx, rdx",
"mov rbx, rsi",
"cmovae rbx, rax",
}
macro_rules! atomic_rmw_with_ifunc {
(
unsafe fn $name:ident($($arg:tt)*) $(-> $ret_ty:ty)?;
cmpxchg16b = $cmpxchg16b_fn:ident;
fallback = $seqcst_fallback_fn:ident;
) => {
#[cfg(not(any(
target_feature = "cmpxchg16b",
portable_atomic_target_feature = "cmpxchg16b",
)))]
#[inline]
unsafe fn $name($($arg)*, _order: Ordering) $(-> $ret_ty)? {
fn_alias! {
#[cfg_attr(
not(any(
target_feature = "cmpxchg16b",
portable_atomic_target_feature = "cmpxchg16b",
)),
target_feature(enable = "cmpxchg16b")
)]
unsafe fn($($arg)*) $(-> $ret_ty)?;
cmpxchg16b_seqcst_fn = $cmpxchg16b_fn(Ordering::SeqCst);
}
unsafe {
ifunc!(unsafe fn($($arg)*) $(-> $ret_ty)? {
if detect::detect().has_cmpxchg16b() {
cmpxchg16b_seqcst_fn
} else {
fallback::$seqcst_fallback_fn
}
})
}
}
};
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_swap(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_swap_cmpxchg16b;
fallback = atomic_swap_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_add(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_add_cmpxchg16b;
fallback = atomic_add_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_sub(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_sub_cmpxchg16b;
fallback = atomic_sub_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_and(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_and_cmpxchg16b;
fallback = atomic_and_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_nand(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_nand_cmpxchg16b;
fallback = atomic_nand_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_or(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_or_cmpxchg16b;
fallback = atomic_or_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_xor(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_xor_cmpxchg16b;
fallback = atomic_xor_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_max(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_max_cmpxchg16b;
fallback = atomic_max_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_umax(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_umax_cmpxchg16b;
fallback = atomic_umax_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_min(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_min_cmpxchg16b;
fallback = atomic_min_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_umin(dst: *mut u128, val: u128) -> u128;
cmpxchg16b = atomic_umin_cmpxchg16b;
fallback = atomic_umin_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_not(dst: *mut u128) -> u128;
cmpxchg16b = atomic_not_cmpxchg16b;
fallback = atomic_not_seqcst;
}
atomic_rmw_with_ifunc! {
unsafe fn atomic_neg(dst: *mut u128) -> u128;
cmpxchg16b = atomic_neg_cmpxchg16b;
fallback = atomic_neg_seqcst;
}
#[inline]
fn is_lock_free() -> bool {
#[cfg(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"))]
{
true
}
#[cfg(not(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b")))]
{
detect::detect().has_cmpxchg16b()
}
}
const IS_ALWAYS_LOCK_FREE: bool =
cfg!(any(target_feature = "cmpxchg16b", portable_atomic_target_feature = "cmpxchg16b"));
atomic128!(AtomicI128, i128, atomic_max, atomic_min);
atomic128!(AtomicU128, u128, atomic_umax, atomic_umin);
#[allow(clippy::undocumented_unsafe_blocks, clippy::wildcard_imports)]
#[cfg(test)]
mod tests {
use super::*;
test_atomic_int!(i128);
test_atomic_int!(u128);
stress_test!(u128);
}