#include "ulong_extras.h"
#include "mpn_extras.h"
#include "nmod_vec.h"
#include "nmod_poly.h"
#include "nmod_mat.h"
void
_nmod_poly_compose_mod_brent_kung_vec_preinv(nmod_poly_struct * res,
const nmod_poly_struct * polys, slong FLINT_UNUSED(lenpolys), slong l,
nn_srcptr g, slong glen, nn_srcptr poly, slong len,
nn_srcptr polyinv, slong leninv, nmod_t mod)
{
nmod_mat_t A, B, C;
nn_ptr t, h;
slong i, j, k, n, m, len2 = l, len1;
n = len - 1;
m = n_sqrt(n*len2) + 1;
h = _nmod_vec_init(n);
t = _nmod_vec_init(n);
k = len/m + 1;
nmod_mat_init(A, m, n, mod.n);
nmod_mat_init(B, k*len2, m, mod.n);
nmod_mat_init(C, k*len2, n, mod.n);
for (j = 0; j < len2; j++)
{
len1 = (polys + j)->length;
for (i = 0; i < len1/m; i++)
_nmod_vec_set(nmod_mat_entry_ptr(B, i + j*k, 0), (polys + j)->coeffs + i*m, m);
_nmod_vec_set(nmod_mat_entry_ptr(B, i + j*k, 0), (polys + j)->coeffs + i*m, len1%m);
}
{
nn_ptr * Arows;
slong i;
Arows = flint_malloc(sizeof(nn_ptr) * A->r);
for (i = 0; i < A->r; i++)
Arows[i] = nmod_mat_entry_ptr(A, i, 0);
_nmod_poly_powers_mod_preinv_naive(Arows, g, glen,
m, poly, len, polyinv, leninv, mod);
flint_free(Arows);
}
nmod_mat_mul(C, B, A);
_nmod_poly_mulmod_preinv(h, nmod_mat_entry_ptr(A, m - 1, 0), n, nmod_mat_entry_ptr(A, 1, 0), n, poly,
len, polyinv, leninv, mod);
for (j = 0; j < len2; j++)
{
nmod_mat_t Cw;
nmod_mat_window_init(Cw, C, j * k, 0, (j + 1) * k, C->c);
_nmod_poly_mod_matrix_rows_evaluate(res[j].coeffs, Cw, h, n, poly, len, polyinv, leninv, mod);
}
_nmod_vec_clear(h);
_nmod_vec_clear(t);
nmod_mat_clear(A);
nmod_mat_clear(B);
nmod_mat_clear(C);
}
void
nmod_poly_compose_mod_brent_kung_vec_preinv(nmod_poly_struct * res,
const nmod_poly_struct * polys, slong len1, slong n,
const nmod_poly_t g, const nmod_poly_t poly, const nmod_poly_t polyinv)
{
slong len2 = poly->length;
slong len3, i;
for (i = 0; i < len1; i++)
{
len3 = (polys + i)->length;
if (len3 >= len2)
{
flint_throw(FLINT_ERROR, "(nmod_poly_compose_mod_brent_kung_vec_preinv): "
"The degree of the first polynomial must be smaller than that of the modulus\n");
}
}
if (n > len1)
{
flint_throw(FLINT_ERROR, "(nmod_poly_compose_mod_brent_kung_vec_preinv): "
"n is larger than the length of polys\n");
}
if (n == 0)
return;
if (len2 == 1)
{
for (i = 0; i < n; i++)
nmod_poly_zero(res + i);
return;
}
if (len2 == 2)
{
for (i = 0; i < n; i++)
nmod_poly_set(res + i, polys + i);
return;
}
for (i = 0; i < n; i++)
{
nmod_poly_fit_length(res + i, len2 - 1);
_nmod_poly_set_length(res + i, len2 - 1);
}
_nmod_poly_compose_mod_brent_kung_vec_preinv(res, polys, len1, n,
g->coeffs, g->length, poly->coeffs, len2, polyinv->coeffs,
polyinv->length, poly->mod);
for (i = 0; i < n; i++)
_nmod_poly_normalise(res + i);
}