/*
Copyright (C) 2011 William Hart
Copyright (C) 2011 Fredrik Johansson
This file is part of FLINT.
FLINT is free software: you can redistribute it and/or modify it under
the terms of the GNU Lesser General Public License (LGPL) as published
by the Free Software Foundation; either version 2.1 of the License, or
(at your option) any later version. See <https://www.gnu.org/licenses/>.
*/
#include
#include "nmod_poly.h"
#include "ulong_extras.h"
/*
    Recursive worker: writes n coefficients of the inverse square root
    series of h into g. The base case sets g[0] = 1, so h is expected to
    have constant term 1. Requires n >= 1 (the recursion only stops at
    n == 1).

    t and u are scratch vectors. If t is NULL, both are allocated here with
    n entries each and released before returning; the recursive calls then
    reuse those same buffers.
*/
static void
__nmod_poly_invsqrt_series_prealloc(mp_ptr g,
                                    mp_srcptr h, mp_ptr t, mp_ptr u,
                                    slong n, nmod_t mod)
{
    slong half;
    mp_limb_t neg_half;
    int own_scratch;

    if (n == 1)
    {
        g[0] = UWORD(1);
        return;
    }

    half = (n + 1) / 2;
    own_scratch = (t == NULL);

    if (own_scratch)
    {
        t = _nmod_vec_init(n);
        u = _nmod_vec_init(n);
    }

    /* Solve to half the length first, then clear the upper part of g so
       that g can be used as a length-n operand below. */
    __nmod_poly_invsqrt_series_prealloc(g, h, t, u, half, mod);
    _nmod_vec_zero(g + half, n - half);

    /* t = g^2. The product has 2*half - 1 terms, which is one short of n
       when n is even, so the last slot is zeroed by hand. */
    _nmod_poly_mul(t, g, half, g, half, mod);
    if (2 * half - 1 < n)
        t[n - 1] = UWORD(0);

    /* u = low n terms of g^3, then t = low n terms of h * g^3. */
    _nmod_poly_mullow(u, t, n, g, n, n, mod);
    _nmod_poly_mullow(t, u, n, h, n, n, mod);

    /* New upper coefficients: g[i] = -(1/2) * t[i] for half <= i < n,
       where -(1/2) is obtained as the inverse of -2 modulo mod.n. */
    neg_half = n_invmod(mod.n - 2, mod.n);
    _nmod_vec_scalar_mul_nmod(g + half, t + half, n - half, neg_half, mod);

    if (own_scratch)
    {
        _nmod_vec_clear(t);
        _nmod_vec_clear(u);
    }
}
/*
    Writes n coefficients of the inverse square root series of h to g.

    Hands the work to the recursive worker with NULL scratch pointers, so
    the worker allocates and frees its own temporaries.
*/
void
_nmod_poly_invsqrt_series(mp_ptr g, mp_srcptr h, slong n, nmod_t mod)
{
    __nmod_poly_invsqrt_series_prealloc(g, h,
                                        NULL, NULL,
                                        n, mod);
}
/*
    Sets g to the inverse square root series of h truncated to length n:
    the n coefficients produced by _nmod_poly_invsqrt_series, followed by
    normalisation of g.

    Preconditions, each enforced by printing a diagnostic and calling
    flint_abort():
      - n must be positive (the underlying recursion has no base case for
        n < 1);
      - h must be nonzero with constant term exactly 1.

    g may alias h. If h has fewer than n coefficients, a zero-padded copy
    of length n is used as input.
*/
void nmod_poly_invsqrt_series(nmod_poly_t g, const nmod_poly_t h, slong n)
{
    const slong hlen = h->length;
    /* A temporary output is needed only when g aliases h AND h's own
       coefficient array is read in place (no padded copy was made). */
    const int use_temp = (h == g && hlen >= n);
    mp_ptr g_coeffs, h_coeffs;
    nmod_poly_t t1;

    if (n <= 0 || hlen == 0 || h->coeffs[0] == 0)
    {
        flint_printf("Exception (nmod_poly_invsqrt_series). Division by zero.\n");
        flint_abort();
    }

    if (h->coeffs[0] != UWORD(1))
    {
        flint_printf("Exception (nmod_poly_invsqrt_series). Constant term != 1.\n");
        flint_abort();
    }

    /* The low-level routine reads n coefficients of h, so pad with zeros
       when h is shorter than that. */
    if (hlen < n)
    {
        h_coeffs = _nmod_vec_init(n);
        flint_mpn_copyi(h_coeffs, h->coeffs, hlen);
        flint_mpn_zero(h_coeffs + hlen, n - hlen);
    }
    else
    {
        h_coeffs = h->coeffs;
    }

    if (use_temp)
    {
        nmod_poly_init2(t1, h->mod.n, n);
        g_coeffs = t1->coeffs;
    }
    else
    {
        nmod_poly_fit_length(g, n);
        g_coeffs = g->coeffs;
    }

    _nmod_poly_invsqrt_series(g_coeffs, h_coeffs, n, h->mod);

    if (use_temp)
    {
        /* Move the result into g; the old contents of g are released
           together with t1. */
        nmod_poly_swap(g, t1);
        nmod_poly_clear(t1);
    }

    g->length = n;

    if (hlen < n)
        _nmod_vec_clear(h_coeffs);

    _nmod_poly_normalise(g);
}