#include "test_helpers.h"
#include "gmpcompat.h"
#include "mpn_extras.h"
#include "fft.h"
#ifndef set_p
#define set_p set_p
void set_p(mpz_t p, mp_size_t n, flint_bitcnt_t w)
{
flint_mpz_set_ui(p, 1);
mpz_mul_2exp(p, p, n*w);
flint_mpz_add_ui(p, p, 1);
}
#endif
void ref_fft_butterfly(mpz_t s, mpz_t t, mpz_t i1, mpz_t i2,
mpz_t p, mp_size_t i, mp_size_t w)
{
mpz_add(s, i1, i2);
mpz_sub(t, i1, i2);
mpz_mul_2exp(t, t, i*w);
mpz_mod(s, s, p);
mpz_mod(t, t, p);
}
void ref_ifft_butterfly(mpz_t s, mpz_t t, mpz_t i1, mpz_t i2,
mpz_t p, mp_size_t i, mp_size_t n, mp_size_t w)
{
mpz_mul_2exp(i2, i2, 2*n*w - i*w);
mpz_add(s, i1, i2);
mpz_sub(t, i1, i2);
mpz_mod(s, s, p);
mpz_mod(t, t, p);
}
TEST_FUNCTION_START(fft_ifft_butterfly, state)
{
mp_size_t c, bits, j, k, n, w, limbs;
mpz_t p, ma, mb, m2a, m2b, mn1, mn2;
mp_limb_t * nn1, * nn2, * r1, * r2;
mpz_init(p);
mpz_init(ma);
mpz_init(mb);
mpz_init(m2a);
mpz_init(m2b);
mpz_init(mn1);
mpz_init(mn2);
for (bits = FLINT_BITS; bits < 20*FLINT_BITS; bits += FLINT_BITS)
{
for (j = 1; j < 10; j++)
{
for (k = 1; k <= FLINT_BITS; k <<= 1)
{
n = bits/k;
w = j*k;
limbs = (n*w)/FLINT_BITS;
for (c = 0; c < n; c++)
{
if (n_randint(state, 100) > 2.0 + flint_test_multiplier() * 10)
continue;
nn1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
nn2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
random_fermat(nn1, state, limbs);
random_fermat(nn2, state, limbs);
fermat_to_mpz(mn1, nn1, limbs);
fermat_to_mpz(mn2, nn2, limbs);
set_p(p, n, w);
fft_butterfly(r1, r2, nn1, nn2, c, limbs, w);
fermat_to_mpz(m2a, r1, limbs);
fermat_to_mpz(m2b, r2, limbs);
mpz_mod(m2a, m2a, p);
mpz_mod(m2b, m2b, p);
ref_fft_butterfly(ma, mb, mn1, mn2, p, c, w);
if (mpz_cmp(ma, m2a) != 0)
{
flint_printf("FAIL:\n");
flint_printf("fft_butterfly error a\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", ma);
gmp_printf("got %Zx\n", m2a);
fflush(stdout);
flint_abort();
}
if (mpz_cmp(mb, m2b) != 0)
{
flint_printf("FAIL:\n");
flint_printf("fft_butterfly error b\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", mb);
gmp_printf("got %Zx\n", m2b);
fflush(stdout);
flint_abort();
}
flint_free(nn1);
flint_free(nn2);
flint_free(r1);
flint_free(r2);
}
}
}
}
for (bits = FLINT_BITS; bits < 20*FLINT_BITS; bits += FLINT_BITS)
{
for (j = 1; j < 10; j++)
{
for (k = 1; k <= FLINT_BITS; k <<= 1)
{
n = bits/k;
w = j*k;
limbs = (n*w)/FLINT_BITS;
for (c = 0; c < n; c++)
{
if (n_randint(state, 100) > 2.0 + flint_test_multiplier() * 10)
continue;
nn1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
nn2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
random_fermat(nn1, state, limbs);
random_fermat(nn2, state, limbs);
fermat_to_mpz(mn1, nn1, limbs);
fermat_to_mpz(mn2, nn2, limbs);
set_p(p, n, w);
ifft_butterfly(r1, r2, nn1, nn2, c, limbs, w);
fermat_to_mpz(m2a, r1, limbs);
fermat_to_mpz(m2b, r2, limbs);
mpz_mod(m2a, m2a, p);
mpz_mod(m2b, m2b, p);
ref_ifft_butterfly(ma, mb, mn1, mn2, p, c, n, w);
if (mpz_cmp(ma, m2a) != 0)
{
flint_printf("FAIL:\n");
flint_printf("ifft_butterfly error a\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", ma);
gmp_printf("got %Zx\n", m2a);
fflush(stdout);
flint_abort();
}
if (mpz_cmp(mb, m2b) != 0)
{
flint_printf("FAIL:\n");
flint_printf("ifft_butterfly error b\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", mb);
gmp_printf("got %Zx\n", m2b);
fflush(stdout);
flint_abort();
}
flint_free(nn1);
flint_free(nn2);
flint_free(r1);
flint_free(r2);
}
}
}
}
mpz_clear(p);
mpz_clear(ma);
mpz_clear(mb);
mpz_clear(m2a);
mpz_clear(m2b);
mpz_clear(mn1);
mpz_clear(mn2);
TEST_FUNCTION_END(state);
}