#if F_SIZE == 32
#define F_UINT uint32_t
#define F_ULONG uint64_t
#define MANT_SIZE 23
#define EXP_SIZE 8
#elif F_SIZE == 64
#define F_UHALF uint32_t
#define F_UINT uint64_t
#ifdef HAVE_INT128
#define F_ULONG uint128_t
#endif
#define MANT_SIZE 52
#define EXP_SIZE 11
#elif F_SIZE == 128
#define F_UHALF uint64_t
#define F_UINT uint128_t
#define MANT_SIZE 112
#define EXP_SIZE 15
#else
#error unsupported F_SIZE
#endif
#define EXP_MASK ((1 << EXP_SIZE) - 1)
#define MANT_MASK (((F_UINT)1 << MANT_SIZE) - 1)
#define SIGN_MASK ((F_UINT)1 << (F_SIZE - 1))
#define IMANT_SIZE (F_SIZE - 2)
#define RND_SIZE (IMANT_SIZE - MANT_SIZE)
#define QNAN_MASK ((F_UINT)1 << (MANT_SIZE - 1))
#define EXP_BIAS ((1 << (EXP_SIZE - 1)) - 1)
#define F_QNAN glue(F_QNAN, F_SIZE)
#define clz glue(clz, F_SIZE)
#define pack_sf glue(pack_sf, F_SIZE)
#define unpack_sf glue(unpack_sf, F_SIZE)
#define rshift_rnd glue(rshift_rnd, F_SIZE)
#define round_pack_sf glue(roundpack_sf, F_SIZE)
#define normalize_sf glue(normalize_sf, F_SIZE)
#define normalize2_sf glue(normalize2_sf, F_SIZE)
#define issignan_sf glue(issignan_sf, F_SIZE)
#define isnan_sf glue(isnan_sf, F_SIZE)
#define add_sf glue(add_sf, F_SIZE)
#define mul_sf glue(mul_sf, F_SIZE)
#define fma_sf glue(fma_sf, F_SIZE)
#define div_sf glue(div_sf, F_SIZE)
#define sqrt_sf glue(sqrt_sf, F_SIZE)
#define normalize_subnormal_sf glue(normalize_subnormal_sf, F_SIZE)
#define divrem_u glue(divrem_u, F_SIZE)
#define sqrtrem_u glue(sqrtrem_u, F_SIZE)
#define mul_u glue(mul_u, F_SIZE)
#define cvt_sf32_sf glue(cvt_sf32_sf, F_SIZE)
#define cvt_sf64_sf glue(cvt_sf64_sf, F_SIZE)
static const F_UINT F_QNAN = (((F_UINT)EXP_MASK << MANT_SIZE) | ((F_UINT)1 << (MANT_SIZE - 1)));
static inline F_UINT pack_sf(uint32_t a_sign, uint32_t a_exp, F_UINT a_mant)
{
return ((F_UINT)a_sign << (F_SIZE - 1)) |
((F_UINT)a_exp << MANT_SIZE) |
(a_mant & MANT_MASK);
}
static inline F_UINT unpack_sf(uint32_t *pa_sign, int32_t *pa_exp,
F_UINT a)
{
*pa_sign = a >> (F_SIZE - 1);
*pa_exp = (a >> MANT_SIZE) & EXP_MASK;
return a & MANT_MASK;
}
static F_UINT rshift_rnd(F_UINT a, int d)
{
F_UINT mask;
if (d != 0) {
if (d >= F_SIZE) {
a = (a != 0);
} else {
mask = ((F_UINT)1 << d) - 1;
a = (a >> d) | ((a & mask) != 0);
}
}
return a;
}
#if F_USE_FFLAGS
#define FFLAGS_PARAM , uint32_t *pfflags
#define FFLAGS_ARG , pfflags
#else
#define FFLAGS_PARAM
#define FFLAGS_ARG
#endif
static F_UINT round_pack_sf(uint32_t a_sign, int a_exp, F_UINT a_mant,
RoundingModeEnum rm FFLAGS_PARAM)
{
int diff;
uint32_t addend, rnd_bits;
switch(rm) {
case RM_RNE:
case RM_RMM:
addend = (1 << (RND_SIZE - 1));
break;
case RM_RTZ:
addend = 0;
break;
default:
case RM_RDN:
case RM_RUP:
if (a_sign ^ (rm & 1))
addend = (1 << RND_SIZE) - 1;
else
addend = 0;
break;
}
if (a_exp <= 0) {
BOOL is_subnormal;
is_subnormal = (a_exp < 0 ||
(a_mant + addend) < ((F_UINT)1 << (F_SIZE - 1)));
diff = 1 - a_exp;
a_mant = rshift_rnd(a_mant, diff);
rnd_bits = a_mant & ((1 << RND_SIZE ) - 1);
if (is_subnormal && rnd_bits != 0) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_UNDERFLOW;
#endif
}
a_exp = 1;
} else {
rnd_bits = a_mant & ((1 << RND_SIZE ) - 1);
}
#if F_USE_FFLAGS
if (rnd_bits != 0)
*pfflags |= FFLAG_INEXACT;
#endif
a_mant = (a_mant + addend) >> RND_SIZE;
if (rm == RM_RNE && rnd_bits == (1 << (RND_SIZE - 1)))
a_mant &= ~1;
a_exp += a_mant >> (MANT_SIZE + 1);
if (a_mant <= MANT_MASK) {
a_exp = 0;
} else if (a_exp >= EXP_MASK) {
if (addend == 0) {
a_exp = EXP_MASK - 1;
a_mant = MANT_MASK;
} else {
a_exp = EXP_MASK;
a_mant = 0;
}
#if F_USE_FFLAGS
*pfflags |= FFLAG_OVERFLOW | FFLAG_INEXACT;
#endif
}
return pack_sf(a_sign, a_exp, a_mant);
}
static F_UINT normalize_sf(uint32_t a_sign, int a_exp, F_UINT a_mant,
RoundingModeEnum rm FFLAGS_PARAM)
{
int shift;
shift = clz(a_mant) - (F_SIZE - 1 - IMANT_SIZE);
assert(shift >= 0);
a_exp -= shift;
a_mant <<= shift;
return round_pack_sf(a_sign, a_exp, a_mant, rm FFLAGS_ARG);
}
static inline F_UINT normalize_subnormal_sf(int32_t *pa_exp, F_UINT a_mant)
{
int shift;
shift = MANT_SIZE - ((F_SIZE - 1 - clz(a_mant)));
*pa_exp = 1 - shift;
return a_mant << shift;
}
#if F_USE_FFLAGS
F_STATIC BOOL issignan_sf(F_UINT a)
{
uint32_t a_exp1;
F_UINT a_mant;
a_exp1 = (a >> (MANT_SIZE - 1)) & ((1 << (EXP_SIZE + 1)) - 1);
a_mant = a & MANT_MASK;
return (a_exp1 == (2 * EXP_MASK) && a_mant != 0);
}
#endif
#ifndef F_NORMALIZE_ONLY
F_STATIC BOOL isnan_sf(F_UINT a)
{
uint32_t a_exp;
F_UINT a_mant;
a_exp = (a >> MANT_SIZE) & EXP_MASK;
a_mant = a & MANT_MASK;
return (a_exp == EXP_MASK && a_mant != 0);
}
F_STATIC F_UINT add_sf(F_UINT a, F_UINT b, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign, b_sign, a_exp, b_exp;
F_UINT tmp, a_mant, b_mant;
if ((a & ~SIGN_MASK) < (b & ~SIGN_MASK)) {
tmp = a;
a = b;
b = tmp;
}
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
a_exp = (a >> MANT_SIZE) & EXP_MASK;
b_exp = (b >> MANT_SIZE) & EXP_MASK;
a_mant = (a & MANT_MASK) << 3;
b_mant = (b & MANT_MASK) << 3;
if (unlikely(a_exp == EXP_MASK)) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (!(a_mant & (QNAN_MASK << 3)) || issignan_sf(b))
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
} else if (b_exp == EXP_MASK && a_sign != b_sign) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
} else {
return a;
}
}
if (a_exp == 0) {
a_exp = 1;
} else {
a_mant |= (F_UINT)1 << (MANT_SIZE + 3);
}
if (b_exp == 0) {
b_exp = 1;
} else {
b_mant |= (F_UINT)1 << (MANT_SIZE + 3);
}
b_mant = rshift_rnd(b_mant, a_exp - b_exp);
if (a_sign == b_sign) {
a_mant += b_mant;
} else {
a_mant -= b_mant;
if (a_mant == 0) {
a_sign = (rm == RM_RDN);
}
}
a_exp += (RND_SIZE - 3);
return normalize_sf(a_sign, a_exp, a_mant, rm FFLAGS_ARG);
}
F_STATIC F_UINT glue(sub_sf, F_SIZE)(F_UINT a, F_UINT b, RoundingModeEnum rm FFLAGS_PARAM)
{
return add_sf(a, b ^ SIGN_MASK, rm FFLAGS_ARG);
}
#ifdef F_ULONG
static F_UINT mul_u(F_UINT *plow, F_UINT a, F_UINT b)
{
F_ULONG r;
r = (F_ULONG)a * (F_ULONG)b;
*plow = r;
return r >> F_SIZE;
}
#else
#define FH_SIZE (F_SIZE / 2)
static F_UINT mul_u(F_UINT *plow, F_UINT a, F_UINT b)
{
F_UHALF a0, a1, b0, b1, r0, r1, r2, r3;
F_UINT r00, r01, r10, r11, c;
a0 = a;
a1 = a >> FH_SIZE;
b0 = b;
b1 = b >> FH_SIZE;
r00 = (F_UINT)a0 * (F_UINT)b0;
r01 = (F_UINT)a0 * (F_UINT)b1;
r10 = (F_UINT)a1 * (F_UINT)b0;
r11 = (F_UINT)a1 * (F_UINT)b1;
r0 = r00;
c = (r00 >> FH_SIZE) + (F_UHALF)r01 + (F_UHALF)r10;
r1 = c;
c = (c >> FH_SIZE) + (r01 >> FH_SIZE) + (r10 >> FH_SIZE) + (F_UHALF)r11;
r2 = c;
r3 = (c >> FH_SIZE) + (r11 >> FH_SIZE);
*plow = ((F_UINT)r1 << FH_SIZE) | r0;
return ((F_UINT)r3 << FH_SIZE) | r2;
}
#undef FH_SIZE
#endif
F_STATIC F_UINT mul_sf(F_UINT a, F_UINT b, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign, b_sign, r_sign;
int32_t a_exp, b_exp, r_exp;
F_UINT a_mant, b_mant, r_mant, r_mant_low;
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
r_sign = a_sign ^ b_sign;
a_exp = (a >> MANT_SIZE) & EXP_MASK;
b_exp = (b >> MANT_SIZE) & EXP_MASK;
a_mant = a & MANT_MASK;
b_mant = b & MANT_MASK;
if (a_exp == EXP_MASK || b_exp == EXP_MASK) {
if (isnan_sf(a) || isnan_sf(b)) {
#if F_USE_FFLAGS
if (issignan_sf(a) || issignan_sf(b)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else {
if ((a_exp == EXP_MASK && (b_exp == 0 && b_mant == 0)) ||
(b_exp == EXP_MASK && (a_exp == 0 && a_mant == 0))) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
} else {
return pack_sf(r_sign, EXP_MASK, 0);
}
}
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf(r_sign, 0, 0);
a_mant = normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
if (b_exp == 0) {
if (b_mant == 0)
return pack_sf(r_sign, 0, 0);
b_mant = normalize_subnormal_sf(&b_exp, b_mant);
} else {
b_mant |= (F_UINT)1 << MANT_SIZE;
}
r_exp = a_exp + b_exp - (1 << (EXP_SIZE - 1)) + 2;
r_mant = mul_u(&r_mant_low,a_mant << RND_SIZE, b_mant << (RND_SIZE + 1));
r_mant |= (r_mant_low != 0);
return normalize_sf(r_sign, r_exp, r_mant, rm FFLAGS_ARG);
}
#ifdef F_ULONG
static F_UINT divrem_u(F_UINT *pr, F_UINT ah, F_UINT al, F_UINT b)
{
F_ULONG a;
a = ((F_ULONG)ah << F_SIZE) | al;
*pr = a % b;
return a / b;
}
#else
static F_UINT divrem_u(F_UINT *pr, F_UINT a1, F_UINT a0, F_UINT b)
{
int i, qb, ab;
assert(a1 < b);
for(i = 0; i < F_SIZE; i++) {
ab = a1 >> (F_SIZE - 1);
a1 = (a1 << 1) | (a0 >> (F_SIZE - 1));
if (ab || a1 >= b) {
a1 -= b;
qb = 1;
} else {
qb = 0;
}
a0 = (a0 << 1) | qb;
}
*pr = a1;
return a0;
}
#endif
F_STATIC F_UINT div_sf(F_UINT a, F_UINT b, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign, b_sign, r_sign;
int32_t a_exp, b_exp, r_exp;
F_UINT a_mant, b_mant, r_mant, r;
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
r_sign = a_sign ^ b_sign;
a_exp = (a >> MANT_SIZE) & EXP_MASK;
b_exp = (b >> MANT_SIZE) & EXP_MASK;
a_mant = a & MANT_MASK;
b_mant = b & MANT_MASK;
if (a_exp == EXP_MASK) {
if (a_mant != 0 || isnan_sf(b)) {
#if F_USE_FFLAGS
if (issignan_sf(a) || issignan_sf(b)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else if (b_exp == EXP_MASK) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
} else {
return pack_sf(r_sign, EXP_MASK, 0);
}
} else if (b_exp == EXP_MASK) {
if (b_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf(a) || issignan_sf(b)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else {
return pack_sf(r_sign, 0, 0);
}
}
if (b_exp == 0) {
if (b_mant == 0) {
if (a_exp == 0 && a_mant == 0) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
} else {
#if F_USE_FFLAGS
*pfflags |= FFLAG_DIVIDE_ZERO;
#endif
return pack_sf(r_sign, EXP_MASK, 0);
}
}
b_mant = normalize_subnormal_sf(&b_exp, b_mant);
} else {
b_mant |= (F_UINT)1 << MANT_SIZE;
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf(r_sign, 0, 0);
a_mant = normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
r_exp = a_exp - b_exp + (1 << (EXP_SIZE - 1)) - 1;
r_mant = divrem_u(&r, a_mant, 0, b_mant << 2);
if (r != 0)
r_mant |= 1;
return normalize_sf(r_sign, r_exp, r_mant, rm FFLAGS_ARG);
}
#ifdef F_ULONG
static int sqrtrem_u(F_UINT *pr, F_UINT ah, F_UINT al)
{
F_ULONG a, u, s;
int l, inexact;
if (ah != 0) {
l = 2 * F_SIZE - clz(ah - 1);
} else {
if (al == 0) {
*pr = 0;
return 0;
}
l = F_SIZE - clz(al - 1);
}
a = ((F_ULONG)ah << F_SIZE) | al;
u = (F_ULONG)1 << ((l + 1) / 2);
for(;;) {
s = u;
u = ((a / s) + s) / 2;
if (u >= s)
break;
}
inexact = (a - s * s) != 0;
*pr = s;
return inexact;
}
#else
static int sqrtrem_u(F_UINT *pr, F_UINT a1, F_UINT a0)
{
int l, inexact;
F_UINT u, s, r, q, sq0, sq1;
if (a1 != 0) {
l = 2 * F_SIZE - clz(a1 - 1);
} else {
if (a0 == 0) {
*pr = 0;
return 0;
}
l = F_SIZE - clz(a0 - 1);
}
u = (F_UINT)1 << ((l + 1) / 2);
for(;;) {
s = u;
q = divrem_u(&r, a1, a0, s);
u = (q + s) / 2;
if (u >= s)
break;
}
sq1 = mul_u(&sq0, s, s);
inexact = (sq0 != a0 || sq1 != a1);
*pr = s;
return inexact;
}
#endif
F_STATIC F_UINT sqrt_sf(F_UINT a, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp;
F_UINT a_mant;
a_sign = a >> (F_SIZE - 1);
a_exp = (a >> MANT_SIZE) & EXP_MASK;
a_mant = a & MANT_MASK;
if (a_exp == EXP_MASK) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf(a)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else if (a_sign) {
goto neg_error;
} else {
return a;
}
}
if (a_sign) {
if (a_exp == 0 && a_mant == 0)
return a;
neg_error:
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return F_QNAN;
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf(0, 0, 0);
a_mant = normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
a_exp -= EXP_MASK / 2;
if (a_exp & 1) {
a_exp--;
a_mant <<= 1;
}
a_exp = (a_exp >> 1) + EXP_MASK / 2;
a_mant <<= (F_SIZE - 4 - MANT_SIZE);
if (sqrtrem_u(&a_mant, a_mant, 0))
a_mant |= 1;
return normalize_sf(a_sign, a_exp, a_mant, rm FFLAGS_ARG);
}
F_STATIC int glue(eq_quiet_sf, F_SIZE)(F_UINT a, F_UINT b FFLAGS_PARAM)
{
if (isnan_sf(a) || isnan_sf(b)) {
#if F_USE_FFLAGS
if (issignan_sf(a) || issignan_sf(b)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return 0;
}
if ((F_UINT)((a | b) << 1) == 0)
return 1;
return (a == b);
}
F_STATIC int glue(le_sf, F_SIZE)(F_UINT a, F_UINT b FFLAGS_PARAM)
{
uint32_t a_sign, b_sign;
if (isnan_sf(a) || isnan_sf(b)) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return 0;
}
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
if (a_sign != b_sign) {
return (a_sign || ((F_UINT)((a | b) << 1) == 0));
} else {
if (a_sign) {
return (a >= b);
} else {
return (a <= b);
}
}
}
F_STATIC int glue(lt_sf, F_SIZE)(F_UINT a, F_UINT b FFLAGS_PARAM)
{
uint32_t a_sign, b_sign;
if (isnan_sf(a) || isnan_sf(b)) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return 0;
}
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
if (a_sign != b_sign) {
return (a_sign && ((F_UINT)((a | b) << 1) != 0));
} else {
if (a_sign) {
return (a > b);
} else {
return (a < b);
}
}
}
F_STATIC int glue(cmp_sf, F_SIZE)(F_UINT a, F_UINT b FFLAGS_PARAM)
{
uint32_t a_sign, b_sign;
if (isnan_sf(a) || isnan_sf(b)) {
#if F_USE_FFLAGS
*pfflags |= FFLAG_INVALID_OP;
#endif
return 2;
}
a_sign = a >> (F_SIZE - 1);
b_sign = b >> (F_SIZE - 1);
if (a_sign != b_sign) {
if ((F_UINT)((a | b) << 1) != 0)
return 1 - 2 * a_sign;
else
return 0;
} else {
if (a < b)
return 2 * a_sign - 1;
else if (a > b)
return 1 - 2 * a_sign;
else
return 0;
}
}
#if F_SIZE >= 64
F_STATIC F_UINT cvt_sf32_sf(uint32_t a FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp;
F_UINT a_mant;
a_mant = unpack_sf32(&a_sign, &a_exp, a);
if (a_exp == 0xff) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf32(a)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else {
return pack_sf(a_sign, EXP_MASK, 0);
}
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf(a_sign, 0, 0);
a_mant = normalize_subnormal_sf32(&a_exp, a_mant);
}
a_exp = a_exp - 0x7f + (EXP_MASK / 2);
a_mant <<= (MANT_SIZE - 23);
return pack_sf(a_sign, a_exp, a_mant);
}
F_STATIC uint32_t glue(glue(cvt_sf, F_SIZE), _sf32)(F_UINT a, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp;
F_UINT a_mant;
a_mant = unpack_sf(&a_sign, &a_exp, a);
if (a_exp == EXP_MASK) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf(a)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN32;
} else {
return pack_sf32(a_sign, 0xff, 0);
}
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf32(a_sign, 0, 0);
normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
a_exp = a_exp - (EXP_MASK / 2) + 0x7f;
a_mant = rshift_rnd(a_mant, MANT_SIZE - (32 - 2));
return normalize_sf32(a_sign, a_exp, a_mant, rm FFLAGS_ARG);
}
#endif
#if F_SIZE >= 128
F_STATIC F_UINT cvt_sf64_sf(uint64_t a FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp;
F_UINT a_mant;
a_mant = unpack_sf64(&a_sign, &a_exp, a);
if (a_exp == 0x7ff) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf64(a)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN;
} else {
return pack_sf(a_sign, EXP_MASK, 0);
}
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf(a_sign, 0, 0);
a_mant = normalize_subnormal_sf64(&a_exp, a_mant);
}
a_exp = a_exp - 0x3ff + (EXP_MASK / 2);
a_mant <<= (MANT_SIZE - 52);
return pack_sf(a_sign, a_exp, a_mant);
}
F_STATIC uint64_t glue(glue(cvt_sf, F_SIZE), _sf64)(F_UINT a, RoundingModeEnum rm FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp;
F_UINT a_mant;
a_mant = unpack_sf(&a_sign, &a_exp, a);
if (a_exp == EXP_MASK) {
if (a_mant != 0) {
#if F_USE_FFLAGS
if (issignan_sf(a)) {
*pfflags |= FFLAG_INVALID_OP;
}
#endif
return F_QNAN64;
} else {
return pack_sf64(a_sign, 0x7ff, 0);
}
}
if (a_exp == 0) {
if (a_mant == 0)
return pack_sf64(a_sign, 0, 0);
normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
a_exp = a_exp - (EXP_MASK / 2) + 0x3ff;
a_mant = rshift_rnd(a_mant, MANT_SIZE - (64 - 2));
return normalize_sf64(a_sign, a_exp, a_mant, rm, pfflags);
}
#endif
#undef clz
#define ICVT_SIZE 32
#include "softfp_template_icvt.h"
#define ICVT_SIZE 64
#include "softfp_template_icvt.h"
F_STATIC F_UINT glue(fmod_sf, F_SIZE)(F_UINT a, F_UINT b FFLAGS_PARAM)
{
uint32_t a_sign;
int32_t a_exp, b_exp, n;
F_UINT a_mant, b_mant, a_abs, b_abs;
a_abs = a & ~SIGN_MASK;
b_abs = b & ~SIGN_MASK;
if (b_abs == 0 ||
a_abs >= ((F_UINT)EXP_MASK << MANT_SIZE) ||
b_abs > ((F_UINT)EXP_MASK << MANT_SIZE)) {
return F_QNAN;
}
if (a_abs < b_abs) {
return a;
} else if (a_abs == b_abs) {
return a & SIGN_MASK;
}
a_sign = a >> (F_SIZE - 1);
a_exp = (a >> MANT_SIZE) & EXP_MASK;
b_exp = (b >> MANT_SIZE) & EXP_MASK;
a_mant = (a & MANT_MASK);
b_mant = (b & MANT_MASK);
if (a_exp == 0) {
a_mant = normalize_subnormal_sf(&a_exp, a_mant);
} else {
a_mant |= (F_UINT)1 << MANT_SIZE;
}
if (b_exp == 0) {
b_mant = normalize_subnormal_sf(&b_exp, b_mant);
} else {
b_mant |= (F_UINT)1 << MANT_SIZE;
}
n = a_exp - b_exp;
if (a_mant >= b_mant)
a_mant -= b_mant;
while (n != 0) {
a_mant <<= 1;
if (a_mant >= b_mant)
a_mant -= b_mant;
n--;
}
return normalize_sf(a_sign, b_exp, a_mant << RND_SIZE, RM_RNE FFLAGS_ARG);
}
#endif
#undef F_SIZE
#undef F_UINT
#undef F_ULONG
#undef F_UHALF
#undef MANT_SIZE
#undef EXP_SIZE
#undef EXP_MASK
#undef MANT_MASK
#undef SIGN_MASK
#undef IMANT_SIZE
#undef RND_SIZE
#undef QNAN_MASK
#undef F_QNAN
#undef F_NORMALIZE_ONLY
#undef EXP_BIAS
#undef pack_sf
#undef unpack_sf
#undef rshift_rnd
#undef round_pack_sf
#undef normalize_sf
#undef normalize2_sf
#undef issignan_sf
#undef isnan_sf
#undef add_sf
#undef mul_sf
#undef fma_sf
#undef div_sf
#undef sqrt_sf
#undef normalize_subnormal_sf
#undef divrem_u
#undef sqrtrem_u
#undef mul_u
#undef cvt_sf32_sf
#undef cvt_sf64_sf