/* Copyright (C) 2010 Sebastian Pancratz Copyright (C) 2010 William Hart Copyright (C) 2012 Lina Kulakova This file is part of FLINT. FLINT is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License (LGPL) as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. See . */ #include #include #include "flint.h" #include "fmpz_vec.h" #include "fmpz_mod_poly.h" void _fmpz_mod_poly_pow_trunc_binexp(fmpz * res, const fmpz * poly, ulong e, slong trunc, const fmpz_t p) { ulong bit = ~((~UWORD(0)) >> 1); fmpz * v = _fmpz_vec_init(trunc); fmpz * R, * S, * T; /* Set bits to the bitmask with a 1 one place lower than the msb of e */ while ((bit & e) == UWORD(0)) bit >>= 1; bit >>= 1; /* Trial run without any polynomial arithmetic to determine the parity of the number of swaps; then set R and S accordingly */ { unsigned int swaps = 0U; ulong bit2 = bit; if ((bit2 & e)) swaps = ~swaps; while (bit2 >>= 1) if ((bit2 & e) == UWORD(0)) swaps = ~swaps; if (swaps == 0U) { R = res; S = v; } else { R = v; S = res; } } /* We unroll the first step of the loop, referring to {poly, len} */ _fmpz_mod_poly_mullow(R, poly, trunc, poly, trunc, p, trunc); if ((bit & e)) { _fmpz_mod_poly_mullow(S, R, trunc, poly, trunc, p, trunc); T = R; R = S; S = T; } while ((bit >>= 1)) { if ((bit & e)) { _fmpz_mod_poly_mullow(S, R, trunc, R, trunc, p, trunc); _fmpz_mod_poly_mullow(R, S, trunc, poly, trunc, p, trunc); } else { _fmpz_mod_poly_mullow(S, R, trunc, R, trunc, p, trunc); T = R; R = S; S = T; } } _fmpz_vec_clear(v, trunc); } void fmpz_mod_poly_pow_trunc_binexp(fmpz_mod_poly_t res, const fmpz_mod_poly_t poly, ulong e, slong trunc, const fmpz_mod_ctx_t ctx) { const slong len = poly->length; fmpz * q; int qcopy = 0; if (len < 2 || e < UWORD(3) || trunc == 0) { if (len == 0 || trunc == 0) { fmpz_mod_poly_zero(res, ctx); } else if (len == 1) { fmpz_mod_poly_fit_length(res, 1, ctx); fmpz_powm_ui(res->coeffs, poly->coeffs, e, fmpz_mod_ctx_modulus(ctx)); _fmpz_mod_poly_set_length(res, 1); _fmpz_mod_poly_normalise(res); } else if (e == UWORD(0)) { fmpz_mod_poly_set_coeff_ui(res, 0, UWORD(1), ctx); _fmpz_mod_poly_set_length(res, 1); _fmpz_mod_poly_normalise(res); } else if (e == UWORD(1)) { fmpz_mod_poly_set(res, poly, ctx); fmpz_mod_poly_truncate(res, trunc, ctx); } else /* e == UWORD(2) */ fmpz_mod_poly_mullow(res, poly, poly, trunc, ctx); return; } if (poly->length < trunc) { q = _fmpz_vec_init(trunc); _fmpz_vec_set(q, poly->coeffs, poly->length); _fmpz_vec_zero(q + poly->length, trunc - poly->length); qcopy = 1; } else q = poly->coeffs; if (res != poly || qcopy) { fmpz_mod_poly_fit_length(res, trunc, ctx); _fmpz_mod_poly_pow_trunc_binexp(res->coeffs, q, e, trunc, fmpz_mod_ctx_modulus(ctx)); } else { fmpz_mod_poly_t t; fmpz_mod_poly_init2(t, trunc, ctx); _fmpz_mod_poly_pow_trunc_binexp(t->coeffs, q, e, trunc, fmpz_mod_ctx_modulus(ctx)); fmpz_mod_poly_swap(res, t, ctx); fmpz_mod_poly_clear(t, ctx); } if (qcopy) _fmpz_vec_clear(q, trunc); _fmpz_mod_poly_set_length(res, trunc); _fmpz_mod_poly_normalise(res); }