#include "ulong_extras.h"
#include "fmpz.h"
#include "fmpz_vec.h"
#include "fmpq_poly.h"
/*
    Accessors for the table of baby-step powers. Both macros are 1-based and
    expand to expressions that use the identifiers R, Rden and n from the
    scope in which they are invoked:

    Ri(ii)    - pointer to the first coefficient of the ii-th row of R,
                where consecutive rows are n - 1 coefficients apart.
    Rdeni(ii) - pointer to the ii-th entry of Rden.

    The argument is parenthesised in both expansions so that an expression
    such as a conditional or a shift can be passed safely.
*/
#define Ri(ii) (R + (n - 1) * ((ii) - 1))
#define Rdeni(ii) (Rden + ((ii) - 1))
/*
    Brings len fractions xnum[k] / xden[k] onto one common denominator.

    On return den holds the least common multiple of xden[0..len-1]
    (den is 1 when len <= 0) and rnum[k] = xnum[k] * (den / xden[k]).

    Every rnum[k] is written only after xnum[k] and xden[k] have been read,
    so rnum may be the same array as xnum (the caller in this file relies
    on that).
*/
static void
_set_vec(fmpz * rnum, fmpz_t den,
         const fmpz * xnum, const fmpz * xden, slong len)
{
    fmpz_t cofactor;
    slong k;

    /* First pass: accumulate the lcm of all denominators. */
    fmpz_one(den);
    k = 0;
    while (k < len)
    {
        fmpz_lcm(den, den, xden + k);
        k++;
    }

    /* Second pass: scale each numerator by den / xden[k]. */
    fmpz_init(cofactor);
    k = 0;
    while (k < len)
    {
        fmpz_divexact(cofactor, den, xden + k);
        fmpz_mul(rnum + k, xnum + k, cofactor);
        k++;
    }
    fmpz_clear(cofactor);
}
/*
    Writes to (Qinv, den) the first n coefficients of the power series
    reversion (compositional inverse) of the series (Q, Qden) of length
    Qlen, using Lagrange inversion with a baby-step / giant-step schedule.

    Qinv - output numerators; n entries are written
    den  - output common denominator
    Q    - input numerators; Q[0] is never read, and Q + 1 is passed to
           _fmpq_poly_inv_series, so the caller is expected to supply a
           series with zero constant term and invertible x^1 coefficient
           (the non-underscore wrapper enforces this)
    Qden - input denominator
    Qlen - number of coefficients in Q
    n    - number of output coefficients; the code indexes Qinv + 1 and
           allocates vectors of length n - 1, so it presumably requires
           n >= 2 -- NOTE(review): confirm against the library docs

    Method, as implemented below, with R = (Q / x)^(-1) mod x^(n-1):

        coefficient i of the result = (1 / i) * [x^(i-1)] R^i.

    The powers R^1 .. R^m, m = n_sqrt(n), are stored explicitly (baby
    steps).  S runs through R^m, R^(2m), ... (giant steps), and the
    single coefficient [x^(i+j-1)] (R^i * R^j) needed for index i + j is
    obtained as a reversed dot product rather than a full multiplication.
    Each coefficient is produced with its own denominator in dens[];
    _set_vec then brings them onto a common denominator.
*/
void
_fmpq_poly_revert_series_lagrange_fast(fmpz * Qinv, fmpz_t den,
        const fmpz * Q, const fmpz_t Qden, slong Qlen, slong n)
{
    slong i, j, m;
    fmpz *R, *Rden, *S, *T, *dens, *tmp;
    fmpz_t Sden, Tden;

    if (Qlen <= 2)
    {
        /* Constant term of the reversion is always zero. */
        fmpz_zero(Qinv);

        if (Qlen == 2)
        {
            /* Q = (Q[1] / Qden) x, so the inverse is (Qden / Q[1]) x. */
            fmpz_set(Qinv + 1, Qden);
            fmpz_set(den, Q + 1);
            _fmpq_poly_canonicalise(Qinv, den, 2);
        }

        _fmpz_vec_zero(Qinv + 2, n - 2);
        return;
    }

    m = n_sqrt(n);

    dens = _fmpz_vec_init(n);           /* per-coefficient denominators */
    R = _fmpz_vec_init((n - 1) * m);    /* rows Ri(1..m), n - 1 entries each */
    S = _fmpz_vec_init(n - 1);
    T = _fmpz_vec_init(n - 1);
    Rden = _fmpz_vec_init(m);           /* denominators of the rows of R */
    fmpz_init(Sden);
    fmpz_init(Tden);

    /* Coefficient 0 is 0 / 1. */
    fmpz_zero(Qinv);
    fmpz_one(dens);

    /* Ri(1) = inverse series of Q / x, to n - 1 terms. */
    _fmpq_poly_inv_series(Ri(1), Rdeni(1), Q + 1, Qden, Qlen - 1, n - 1);
    _fmpq_poly_canonicalise(Ri(1), Rdeni(1), n - 1);

    /* Baby steps: Ri(i) = Ri(i-1) * Ri(1), truncated to n - 1 terms. */
    for (i = 2; i <= m; i++)
    {
        _fmpq_poly_mullow(Ri(i), Rdeni(i), Ri(i-1), Rdeni(i-1), n - 1,
            Ri(1), Rdeni(1), n - 1, n - 1);
        _fmpq_poly_canonicalise(Ri(i), Rdeni(i), n - 1);
    }

    /* Indices 1 .. m-1 are read directly off the stored powers. */
    for (i = 1; i < m; i++)
    {
        fmpz_set(Qinv + i, Ri(i) + i - 1);
        fmpz_mul_ui(dens + i, Rdeni(i), i);
    }

    /* Giant steps: S holds the i-th power of Ri(1), starting with i = m. */
    _fmpz_vec_set(S, Ri(m), n - 1);
    fmpz_set(Sden, Rdeni(m));

    for (i = m; i < n; i += m)
    {
        /* Index i comes straight from S. */
        fmpz_set(Qinv + i, S + i - 1);
        fmpz_mul_ui(dens + i, Sden, i);

        for (j = 1; j < m && i + j < n; j++)
        {
            /*
                Numerator of [x^(i+j-1)] (S * Ri(j)): a dot product of
                length i + j with the second operand read in reverse.
            */
            _fmpz_vec_dot_general(Qinv + i + j, NULL, 0, S, Ri(j), 1, i + j);
            fmpz_mul(dens + i + j, Sden, Rdeni(j));
            fmpz_mul_ui(dens + i + j, dens + i + j, i + j);
        }

        /*
            Advance S by a factor Ri(m) for the next outer iteration.  S is
            read nowhere else, so the product is skipped when no further
            iteration will run (i.e. when i + m >= n).
        */
        if (i + m < n)
        {
            _fmpq_poly_mullow(T, Tden, S, Sden, n - 1,
                Ri(m), Rdeni(m), n - 1, n - 1);
            _fmpq_poly_canonicalise(T, Tden, n - 1);
            fmpz_swap(Tden, Sden);
            tmp = S; S = T; T = tmp;
        }
    }

    /* Combine the individual fractions (in place) and reduce. */
    _set_vec(Qinv, den, Qinv, dens, n);
    _fmpq_poly_canonicalise(Qinv, den, n);

    _fmpz_vec_clear(dens, n);
    _fmpz_vec_clear(R, (n - 1) * m);
    _fmpz_vec_clear(S, n - 1);
    _fmpz_vec_clear(T, n - 1);
    _fmpz_vec_clear(Rden, m);
    fmpz_clear(Sden);
    fmpz_clear(Tden);
}
/*
    Sets res to the power series reversion of poly, computed to n
    coefficients by _fmpq_poly_revert_series_lagrange_fast.

    Throws FLINT_ERROR unless poly has length at least 2, a zero constant
    term and a nonzero coefficient of x^1.  For n < 2 the result is the
    zero polynomial.  res may be the same object as poly; in that case the
    result is built in a temporary and swapped in.
*/
void
fmpq_poly_revert_series_lagrange_fast(fmpq_poly_t res,
                                      const fmpq_poly_t poly, slong n)
{
    /* Same checks, same order: length first, then x^0, then x^1. */
    int input_ok = poly->length >= 2
        && fmpz_is_zero(poly->coeffs)
        && !fmpz_is_zero(poly->coeffs + 1);

    if (!input_ok)
    {
        flint_throw(FLINT_ERROR, "(fmpq_poly_revert_series_lagrange_fast): Input must "
            "have zero constant term and nonzero coefficient of x^1.\n");
    }

    if (n < 2)
    {
        fmpq_poly_zero(res);
        return;
    }

    if (res == poly)
    {
        /* Output aliases input: compute into scratch space first. */
        fmpq_poly_t scratch;

        fmpq_poly_init2(scratch, n);
        _fmpq_poly_revert_series_lagrange_fast(scratch->coeffs,
            scratch->den, poly->coeffs, poly->den, poly->length, n);
        fmpq_poly_swap(res, scratch);
        fmpq_poly_clear(scratch);
    }
    else
    {
        fmpq_poly_fit_length(res, n);
        _fmpq_poly_revert_series_lagrange_fast(res->coeffs,
            res->den, poly->coeffs, poly->den, poly->length, n);
    }

    /* Record the length, then normalise. */
    _fmpq_poly_set_length(res, n);
    _fmpq_poly_normalise(res);
}