#include "mpn_extras.h"
#include "nmod.h"
#include "nmod_vec.h"
#include "nmod_poly.h"
#include "gr_poly.h"
/*
    Cutoff table for the extended GCD, one entry per modulus bit size.
    nmod_poly_xgcd_hgcd_cutoff() reads entry NMOD_BITS(mod) - 1, so entry i
    is the cutoff used for moduli of i + 1 bits.  _nmod_poly_xgcd() uses the
    Euclidean algorithm when lenB is below the cutoff and the half-GCD
    based algorithm otherwise.
    NOTE(review): the values look like empirically tuned thresholds --
    confirm against the tuning procedure before editing them.
*/
static const short nmod_poly_xgcd_hgcd_cutoff_tab[64] = {
159, 89, 75, 85, 72, 78, 81, 89, 85, 89, 93, 97, 97, 93, 101, 97, 97,
106, 106, 121, 111, 101, 101, 101, 106, 106, 106, 101, 106, 182, 191, 191,
200, 231, 200, 191, 220, 210, 210, 231, 231, 220, 210, 220, 242, 210, 231,
220, 254, 254, 242, 242, 242, 254, 306, 306, 266, 306, 292, 306, 321, 306,
388, 166,
};
/*
    Returns the length cutoff for switching from the Euclidean to the
    half-GCD based extended GCD, looked up by the bit size of the modulus.
*/
slong nmod_poly_xgcd_hgcd_cutoff(nmod_t mod)
{
    /* Table entry i corresponds to moduli of i + 1 bits. */
    const slong tab_index = (slong) NMOD_BITS(mod) - 1;

    return nmod_poly_xgcd_hgcd_cutoff_tab[tab_index];
}
/*
    Extended GCD on raw coefficient arrays; returns the length of G.

    Picks the algorithm from the length of B: below the modulus-dependent
    cutoff the Euclidean implementation is used, otherwise the work is
    handed to the generic half-GCD routine through an nmod gr context.
*/
slong _nmod_poly_xgcd(nn_ptr G, nn_ptr S, nn_ptr T,
                      nn_srcptr A, slong lenA, nn_srcptr B, slong lenB,
                      nmod_t mod)
{
    const slong hgcd_threshold = nmod_poly_xgcd_hgcd_cutoff(mod);
    slong iter_threshold;
    slong gcd_len = 0;
    gr_ctx_t gr;

    /* Short inputs: plain Euclidean algorithm. */
    if (lenB < hgcd_threshold)
        return _nmod_poly_xgcd_euclidean(G, S, T, A, lenA, B, lenB, mod);

    iter_threshold = nmod_poly_hgcd_iter_recursive_cutoff(mod);
    _gr_ctx_init_nmod(gr, &mod);
    GR_MUST_SUCCEED(_gr_poly_xgcd_hgcd(&gcd_len, G, S, T, A, lenA, B, lenB,
                                       iter_threshold, hgcd_threshold, gr));

    return gcd_len;
}
/*
    Extended GCD of A and B.

    On return G is the monic GCD of A and B (zero when both are zero) and
    S, T are the cofactors produced by _nmod_poly_xgcd(), which are meant
    to satisfy S*A + T*B = G.  Any of G, S, T may alias A or B: in that
    case the result is built in a temporary buffer and swapped in after
    the computation.

    Leading coefficients are inverted with n_invmod(), so they are assumed
    to be invertible modulo A->mod.n (e.g. prime modulus).
*/
void
nmod_poly_xgcd(nmod_poly_t G, nmod_poly_t S, nmod_poly_t T,
               const nmod_poly_t A, const nmod_poly_t B)
{
    if (A->length < B->length)
    {
        /* Normalise to lenA >= lenB; swapping inputs swaps the cofactors. */
        nmod_poly_xgcd(G, T, S, B, A);
    }
    else  /* lenA >= lenB >= 0 */
    {
        const slong lenA = A->length, lenB = B->length;
        ulong inv;

        if (lenA == 0)  /* A = B = 0 */
        {
            nmod_poly_zero(G);
            nmod_poly_zero(S);
            nmod_poly_zero(T);
        }
        else if (lenB == 0)  /* B = 0: G = A / lc(A), S = 1 / lc(A), T = 0 */
        {
            inv = n_invmod(A->coeffs[lenA - 1], A->mod.n);
            nmod_poly_scalar_mul_nmod(G, A, inv);
            nmod_poly_zero(T);
            nmod_poly_set_coeff_ui(S, 0, inv);
            S->length = 1;
        }
        else if (lenB == 1)  /* B is a constant: G = 1, S = 0, T = 1 / B */
        {
            nmod_poly_fit_length(T, 1);
            T->length = 1;
            T->coeffs[0] = n_invmod(B->coeffs[0], A->mod.n);
            nmod_poly_one(G);
            nmod_poly_zero(S);
        }
        else  /* lenA >= lenB >= 2 */
        {
            /* Outputs that alias an input must not be written in place. */
            const int G_aliased = (G == A || G == B);
            const int S_aliased = (S == A || S == B);
            const int T_aliased = (T == A || T == B);
            nn_ptr g, s, t;
            slong lenG;

            /* Space: G needs lenB, S needs lenB - 1, T needs lenA - 1. */
            if (G_aliased)
            {
                g = _nmod_vec_init(lenB);
            }
            else
            {
                nmod_poly_fit_length(G, lenB);
                g = G->coeffs;
            }
            if (S_aliased)
            {
                s = _nmod_vec_init(lenB - 1);
            }
            else
            {
                nmod_poly_fit_length(S, lenB - 1);
                s = S->coeffs;
            }
            if (T_aliased)
            {
                t = _nmod_vec_init(lenA - 1);
            }
            else
            {
                nmod_poly_fit_length(T, lenA - 1);
                t = T->coeffs;
            }

            /* lenA >= lenB is guaranteed here, so no operand swap is needed. */
            lenG = _nmod_poly_xgcd(g, s, t, A->coeffs, lenA,
                                   B->coeffs, lenB, A->mod);

            /* Install the temporaries in place of the aliased storage. */
            if (G_aliased)
            {
                flint_free(G->coeffs);
                G->coeffs = g;
                G->alloc = lenB;
            }
            if (S_aliased)
            {
                flint_free(S->coeffs);
                S->coeffs = s;
                S->alloc = lenB - 1;
            }
            if (T_aliased)
            {
                flint_free(T->coeffs);
                T->coeffs = t;
                T->alloc = lenA - 1;
            }

            /* Upper bounds on the cofactor lengths, then strip zeros. */
            G->length = lenG;
            S->length = FLINT_MAX(lenB - lenG, 1);
            T->length = FLINT_MAX(lenA - lenG, 1);
            MPN_NORM(S->coeffs, S->length);
            MPN_NORM(T->coeffs, T->length);

            /* Make G monic, scaling the cofactors by the same unit. */
            if (G->coeffs[lenG - 1] != 1)
            {
                inv = n_invmod(G->coeffs[lenG - 1], A->mod.n);
                nmod_poly_scalar_mul_nmod(G, G, inv);
                nmod_poly_scalar_mul_nmod(S, S, inv);
                nmod_poly_scalar_mul_nmod(T, T, inv);
            }
        }
    }
}
/*
    Extended Euclidean algorithm on raw coefficient arrays.

    Writes a GCD of A and B to G (not normalised to be monic here), a
    cofactor to S, and to T the quotient of (G - S*A) by B.  Returns the
    length of G.

    G, S and T are zeroed over lenB, lenB - 1 and lenA - 1 entries on
    entry, so the caller must provide at least that much space.
    NOTE(review): the code assumes lenA >= lenB >= 1 with nonzero leading
    coefficients, and that no output aliases an input -- confirm with callers.
*/
slong _nmod_poly_xgcd_euclidean(nn_ptr G, nn_ptr S, nn_ptr T,
nn_srcptr A, slong lenA,
nn_srcptr B, slong lenB, nmod_t mod)
{
flint_mpn_zero(G, lenB);
flint_mpn_zero(S, lenB - 1);
flint_mpn_zero(T, lenA - 1);
/* B is a constant: G = B, S = 0 (already zeroed), T = 1. */
if (lenB == 1)
{
G[0] = B[0];
T[0] = 1;
return 1;
}
else
{
nn_ptr Q, R;
slong lenQ, lenR, lenG;
/* One allocation of 2 * lenA words: Q is the lower half, R the upper. */
Q = _nmod_vec_init(2 * lenA);
R = Q + lenA;
/* First division step: A = Q * B + R. */
_nmod_poly_divrem(Q, R, A, lenA, B, lenB, mod);
lenR = lenB - 1;
MPN_NORM(R, lenR);
/* Zero remainder: B divides A, so G = B, S = 0, T = 1. */
if (lenR == 0)
{
_nmod_vec_set(G, B, lenB);
T[0] = 1;
lenG = lenB;
}
else
{
nn_ptr D, U, V1, V3, W;
slong lenD, lenU, lenV1, lenV3, lenW;
/* One workspace carved into five consecutive lenB-sized pieces
   (W, D, U, V1, V3); W itself also serves as scratch for products
   and for the remainder of the final division. */
W = _nmod_vec_init(FLINT_MAX(5 * lenB, lenA + lenB));
D = W + lenB;
U = D + lenB;
V1 = U + lenB;
V3 = V1 + lenB;
/* Initial state: D = B, V3 = A mod B (taken over from R by swapping
   pointers), U = 0, V1 = 1. */
lenU = 0;
_nmod_vec_set(D, B, lenB);
lenD = lenB;
V1[0] = 1;
lenV1 = 1;
lenV3 = 0;
MPN_SWAP(V3, lenV3, R, lenR);
do {
/* D = Q * V3 + R. */
_nmod_poly_divrem(Q, R, D, lenD, V3, lenV3, mod);
lenQ = lenD - lenV3 + 1;
lenR = lenV3 - 1;
MPN_NORM(R, lenR);
/* W = Q * V1, passing the longer operand first. */
if (lenV1 >= lenQ)
_nmod_poly_mul(W, V1, lenV1, Q, lenQ, mod);
else
_nmod_poly_mul(W, Q, lenQ, V1, lenV1, mod);
lenW = lenQ + lenV1 - 1;
/* U = U - Q * V1, then swap so that (U, V1) <- (V1, U - Q * V1). */
_nmod_poly_sub(U, U, lenU, W, lenW, mod);
lenU = FLINT_MAX(lenU, lenW);
MPN_NORM(U, lenU);
MPN_SWAP(U, lenU, V1, lenV1);
/* Rotate (D, V3, R) <- (V3, R, D): only pointers and lengths move,
   and the old D storage receives the next remainder. */
{
nn_ptr __t;
slong __tn;
__t = D;
D = V3;
V3 = R;
R = __t;
__tn = lenD;
lenD = lenV3;
lenV3 = lenR;
lenR = __tn;
}
} while (lenV3 != 0);
/* The last nonzero remainder is the GCD; U is the cofactor S. */
_nmod_vec_set(G, D, lenD);
_nmod_vec_set(S, U, lenU);
/* Recover T as the quotient of (G - A * S) by B; the remainder
   goes to W and is discarded. */
{
lenQ = lenA + lenU - 1;
_nmod_poly_mul(Q, A, lenA, S, lenU, mod);
_nmod_vec_neg(Q, Q, lenQ, mod);
_nmod_poly_add(Q, G, lenD, Q, lenQ, mod);
_nmod_poly_divrem(T, W, Q, lenQ, B, lenB, mod);
}
_nmod_vec_clear(W);
lenG = lenD;
}
_nmod_vec_clear(Q);
return lenG;
}
}
/*
    Extended GCD of A and B using the Euclidean algorithm.

    On return G is the monic GCD of A and B (zero when both are zero) and
    S, T are cofactors with S*A + T*B = G.  Any of G, S, T may alias A or
    B: in that case the result is built in a temporary buffer and swapped
    in after the computation.

    Leading coefficients are inverted with n_invmod(), so they are assumed
    to be invertible modulo A->mod.n (e.g. prime modulus).
*/
void
nmod_poly_xgcd_euclidean(nmod_poly_t G, nmod_poly_t S, nmod_poly_t T,
                         const nmod_poly_t A, const nmod_poly_t B)
{
    if (A->length < B->length)
    {
        /* Normalise to lenA >= lenB; swapping inputs swaps the cofactors. */
        nmod_poly_xgcd_euclidean(G, T, S, B, A);
    }
    else  /* lenA >= lenB >= 0 */
    {
        const slong lenA = A->length, lenB = B->length;
        ulong inv;

        if (lenA == 0)  /* A = B = 0 */
        {
            nmod_poly_zero(G);
            nmod_poly_zero(S);
            nmod_poly_zero(T);
        }
        else if (lenB == 0)  /* B = 0: G = A / lc(A), S = 1 / lc(A), T = 0 */
        {
            inv = n_invmod(A->coeffs[lenA - 1], A->mod.n);
            nmod_poly_scalar_mul_nmod(G, A, inv);
            nmod_poly_zero(T);
            nmod_poly_set_coeff_ui(S, 0, inv);
            S->length = 1;
        }
        else if (lenB == 1)  /* B is a constant: G = 1, S = 0, T = 1 / B */
        {
            nmod_poly_fit_length(T, 1);
            T->length = 1;
            T->coeffs[0] = n_invmod(B->coeffs[0], A->mod.n);
            nmod_poly_one(G);
            nmod_poly_zero(S);
        }
        else  /* lenA >= lenB >= 2 */
        {
            /* Outputs that alias an input must not be written in place. */
            const int G_aliased = (G == A || G == B);
            const int S_aliased = (S == A || S == B);
            const int T_aliased = (T == A || T == B);
            nn_ptr g, s, t;
            slong lenG;

            /* Space: G needs lenB, S needs lenB - 1, T needs lenA - 1. */
            if (G_aliased)
            {
                g = _nmod_vec_init(lenB);
            }
            else
            {
                nmod_poly_fit_length(G, lenB);
                g = G->coeffs;
            }
            if (S_aliased)
            {
                s = _nmod_vec_init(lenB - 1);
            }
            else
            {
                nmod_poly_fit_length(S, lenB - 1);
                s = S->coeffs;
            }
            if (T_aliased)
            {
                t = _nmod_vec_init(lenA - 1);
            }
            else
            {
                nmod_poly_fit_length(T, lenA - 1);
                t = T->coeffs;
            }

            /* lenA >= lenB is guaranteed here, so no operand swap is needed. */
            lenG = _nmod_poly_xgcd_euclidean(g, s, t, A->coeffs, lenA,
                                             B->coeffs, lenB, A->mod);

            /* Install the temporaries in place of the aliased storage. */
            if (G_aliased)
            {
                flint_free(G->coeffs);
                G->coeffs = g;
                G->alloc = lenB;
            }
            if (S_aliased)
            {
                flint_free(S->coeffs);
                S->coeffs = s;
                S->alloc = lenB - 1;
            }
            if (T_aliased)
            {
                flint_free(T->coeffs);
                T->coeffs = t;
                T->alloc = lenA - 1;
            }

            /* Upper bounds on the cofactor lengths, then strip zeros. */
            G->length = lenG;
            S->length = FLINT_MAX(lenB - lenG, 1);
            T->length = FLINT_MAX(lenA - lenG, 1);
            MPN_NORM(S->coeffs, S->length);
            MPN_NORM(T->coeffs, T->length);

            /* Make G monic, scaling the cofactors by the same unit. */
            if (G->coeffs[lenG - 1] != 1)
            {
                inv = n_invmod(G->coeffs[lenG - 1], A->mod.n);
                nmod_poly_scalar_mul_nmod(G, G, inv);
                nmod_poly_scalar_mul_nmod(S, S, inv);
                nmod_poly_scalar_mul_nmod(T, T, inv);
            }
        }
    }
}
/*
    Half-GCD based extended GCD on raw coefficient arrays; returns the
    length of G.  Wraps the modulus in an nmod gr context and forwards to
    the generic _gr_poly_xgcd_hgcd() with the nmod-specific cutoffs.
*/
slong _nmod_poly_xgcd_hgcd(nn_ptr G, nn_ptr S, nn_ptr T,
                           nn_srcptr A, slong lenA, nn_srcptr B, slong lenB,
                           nmod_t mod)
{
    const slong xgcd_threshold = nmod_poly_xgcd_hgcd_cutoff(mod);
    const slong iter_threshold = nmod_poly_hgcd_iter_recursive_cutoff(mod);
    slong gcd_len = 0;
    gr_ctx_t gr;

    _gr_ctx_init_nmod(gr, &mod);
    GR_MUST_SUCCEED(_gr_poly_xgcd_hgcd(&gcd_len, G, S, T, A, lenA, B, lenB,
                                       iter_threshold, xgcd_threshold, gr));

    return gcd_len;
}
/*
    Extended GCD of A and B using the half-GCD based algorithm.

    On return G is the monic GCD of A and B (zero when both are zero) and
    S, T are the cofactors produced by _nmod_poly_xgcd_hgcd(), which are
    meant to satisfy S*A + T*B = G.  Any of G, S, T may alias A or B: in
    that case the result is built in a temporary buffer and swapped in
    after the computation.

    Leading coefficients are inverted with n_invmod(), so they are assumed
    to be invertible modulo A->mod.n (e.g. prime modulus).
*/
void
nmod_poly_xgcd_hgcd(nmod_poly_t G, nmod_poly_t S, nmod_poly_t T,
                    const nmod_poly_t A, const nmod_poly_t B)
{
    if (A->length < B->length)
    {
        /* Normalise to lenA >= lenB; swapping inputs swaps the cofactors. */
        nmod_poly_xgcd_hgcd(G, T, S, B, A);
    }
    else  /* lenA >= lenB >= 0 */
    {
        const slong lenA = A->length, lenB = B->length;
        ulong inv;

        if (lenA == 0)  /* A = B = 0 */
        {
            nmod_poly_zero(G);
            nmod_poly_zero(S);
            nmod_poly_zero(T);
        }
        else if (lenB == 0)  /* B = 0: G = A / lc(A), S = 1 / lc(A), T = 0 */
        {
            inv = n_invmod(A->coeffs[lenA - 1], A->mod.n);
            nmod_poly_scalar_mul_nmod(G, A, inv);
            nmod_poly_zero(T);
            nmod_poly_set_coeff_ui(S, 0, inv);
            S->length = 1;
        }
        else if (lenB == 1)  /* B is a constant: G = 1, S = 0, T = 1 / B */
        {
            nmod_poly_fit_length(T, 1);
            T->length = 1;
            T->coeffs[0] = n_invmod(B->coeffs[0], A->mod.n);
            nmod_poly_one(G);
            nmod_poly_zero(S);
        }
        else  /* lenA >= lenB >= 2 */
        {
            /* Outputs that alias an input must not be written in place. */
            const int G_aliased = (G == A || G == B);
            const int S_aliased = (S == A || S == B);
            const int T_aliased = (T == A || T == B);
            nn_ptr g, s, t;
            slong lenG;

            /* Space: G needs lenB, S needs lenB - 1, T needs lenA - 1. */
            if (G_aliased)
            {
                g = _nmod_vec_init(lenB);
            }
            else
            {
                nmod_poly_fit_length(G, lenB);
                g = G->coeffs;
            }
            if (S_aliased)
            {
                s = _nmod_vec_init(lenB - 1);
            }
            else
            {
                nmod_poly_fit_length(S, lenB - 1);
                s = S->coeffs;
            }
            if (T_aliased)
            {
                t = _nmod_vec_init(lenA - 1);
            }
            else
            {
                nmod_poly_fit_length(T, lenA - 1);
                t = T->coeffs;
            }

            /* lenA >= lenB is guaranteed here, so no operand swap is needed. */
            lenG = _nmod_poly_xgcd_hgcd(g, s, t, A->coeffs, lenA,
                                        B->coeffs, lenB, A->mod);

            /* Install the temporaries in place of the aliased storage. */
            if (G_aliased)
            {
                flint_free(G->coeffs);
                G->coeffs = g;
                G->alloc = lenB;
            }
            if (S_aliased)
            {
                flint_free(S->coeffs);
                S->coeffs = s;
                S->alloc = lenB - 1;
            }
            if (T_aliased)
            {
                flint_free(T->coeffs);
                T->coeffs = t;
                T->alloc = lenA - 1;
            }

            /* Upper bounds on the cofactor lengths, then strip zeros. */
            G->length = lenG;
            S->length = FLINT_MAX(lenB - lenG, 1);
            T->length = FLINT_MAX(lenA - lenG, 1);
            MPN_NORM(S->coeffs, S->length);
            MPN_NORM(T->coeffs, T->length);

            /* Make G monic, scaling the cofactors by the same unit. */
            if (G->coeffs[lenG - 1] != 1)
            {
                inv = n_invmod(G->coeffs[lenG - 1], A->mod.n);
                nmod_poly_scalar_mul_nmod(G, G, inv);
                nmod_poly_scalar_mul_nmod(S, S, inv);
                nmod_poly_scalar_mul_nmod(T, T, inv);
            }
        }
    }
}