#include "nmod_vec.h"
#include "nmod_poly.h"
#define MAX_NZ 6
static int
_nmod_poly_divrem_try_sparse(nn_ptr Q, nn_ptr R, nn_srcptr A,
slong lenA, nn_srcptr B, slong lenB,
nn_srcptr Binv, slong FLINT_UNUSED(lenBinv), nmod_t mod)
{
slong nz, i, j, k;
slong exps[MAX_NZ];
ulong coeffs[MAX_NZ];
slong n = lenB - 1;
ulong c, leadB;
ulong negcbound;
nn_ptr r;
nz = 1;
for (i = 0; i < lenB - 1; i++)
{
if (B[i] != 0)
{
exps[nz - 1] = i;
coeffs[nz - 1] = mod.n - B[i];
nz++;
if (nz > MAX_NZ)
return 0;
}
}
leadB = B[lenB - 1];
if (leadB != 1)
_nmod_vec_scalar_mul_nmod(coeffs, coeffs, nz - 1, Binv[0], mod);
negcbound = 0;
for (i = 0; i < nz - 1; i++)
negcbound |= (mod.n - coeffs[i]);
TMP_INIT;
TMP_START;
r = TMP_ALLOC((lenA) * sizeof(ulong));
_nmod_vec_set(r, A, lenA);
if (mod.n == 2)
{
for (i = lenA - 1; i >= n; i--)
{
Q[i - n] = c = r[i];
for (k = nz - 2; k >= 0; k--)
{
j = exps[k];
r[j + i - n] ^= c;
}
}
}
else if (negcbound == 1)
{
for (i = lenA - 1; i >= n; i--)
{
Q[i - n] = c = r[i];
for (k = nz - 2; k >= 0; k--)
{
j = exps[k];
r[j + i - n] = nmod_sub(r[j + i - n], c, mod);
}
}
}
else if (NMOD_BITS(mod) < FLINT_BITS / 2)
{
ulong ninv = n_barrett_precomp(mod.n);
for (i = lenA - 1; i >= n; i--)
{
Q[i - n] = c = r[i];
for (k = nz - 2; k >= 0; k--)
{
j = exps[k];
r[j + i - n] = n_mod_barrett(r[j + i - n] + c * coeffs[k], mod.n, ninv);
}
}
}
else
{
for (i = lenA - 1; i >= n; i--)
{
Q[i - n] = c = r[i];
for (k = nz - 2; k >= 0; k--)
{
j = exps[k];
r[j + i - n] = nmod_addmul(r[j + i - n], c, coeffs[k], mod);
}
}
}
if (leadB != 1)
_nmod_vec_scalar_mul_nmod(Q, Q, lenA - lenB + 1, Binv[0], mod);
_nmod_vec_set(R, r, n);
TMP_END;
return 1;
}
void _nmod_poly_divrem_newton_n_preinv(nn_ptr Q, nn_ptr R, nn_srcptr A,
slong lenA, nn_srcptr B, slong lenB,
nn_srcptr Binv, slong lenBinv, nmod_t mod)
{
const slong lenQ = lenA - lenB + 1;
if (lenA == lenB + 1)
{
_nmod_poly_divrem_basecase_preinv1(Q, R, A, lenA, B, lenB, Binv[0], mod);
return;
}
if (lenB > 20 && _nmod_poly_divrem_try_sparse(Q, R, A, lenA, B, lenB, Binv, lenBinv, mod))
return;
_nmod_poly_div_newton_n_preinv(Q, A, lenA, B, lenB, Binv, lenBinv, mod);
if (lenB > 1)
{
if (lenQ >= lenB - 1)
_nmod_poly_mullow(R, Q, lenQ, B, lenB - 1, lenB - 1, mod);
else
_nmod_poly_mullow(R, B, lenB - 1, Q, lenQ, lenB - 1, mod);
_nmod_vec_sub(R, A, R, lenB - 1, mod);
}
}
void nmod_poly_divrem_newton_n_preinv(nmod_poly_t Q, nmod_poly_t R,
const nmod_poly_t A, const nmod_poly_t B,
const nmod_poly_t Binv)
{
const slong lenA = A->length, lenB = B->length, lenBinv = Binv->length;
nn_ptr q, r;
if (lenB == 0)
{
if (nmod_poly_modulus(B) == 1)
{
nmod_poly_set(Q, A);
nmod_poly_zero(R);
return;
} else
{
flint_throw(FLINT_DIVZERO, "Exception (nmod_poly_divrem_newton_n_preinv). Division by zero.\n");
}
}
if (lenA < lenB)
{
nmod_poly_set(R, A);
nmod_poly_zero(Q);
return;
}
if (lenA > 2 * lenB - 1)
{
flint_printf ("Exception (nmod_poly_divrem_newton_n_preinv).\n");
}
if (Q == A || Q == B || Q == Binv)
{
q = _nmod_vec_init(lenA - lenB + 1);
}
else
{
nmod_poly_fit_length(Q, lenA - lenB + 1);
q = Q->coeffs;
}
if (R == A || R == B || R == Binv)
{
r = _nmod_vec_init(lenB - 1);
}
else
{
nmod_poly_fit_length(R, lenB - 1);
r = R->coeffs;
}
_nmod_poly_divrem_newton_n_preinv(q, r, A->coeffs, lenA,
B->coeffs, lenB, Binv->coeffs, lenBinv, B->mod);
if (Q == A || Q == B || Q == Binv)
{
_nmod_vec_clear(Q->coeffs);
Q->coeffs = q;
Q->alloc = lenA - lenB + 1;
}
if (R == A || R == B || R == Binv)
{
_nmod_vec_clear(R->coeffs);
R->coeffs = r;
R->alloc = lenB - 1;
}
Q->length = lenA - lenB + 1;
R->length = lenB - 1;
_nmod_poly_normalise(R);
}