/* Copyright (C) 2010, 2011 Sebastian Pancratz This file is part of FLINT. FLINT is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License (LGPL) as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. See . */ #include #include #include "flint.h" #include "fmpz.h" #include "fmpz_vec.h" #include "fmpz_poly.h" #include "fmpz_mod_poly.h" void _fmpz_mod_poly_pow(fmpz *res, const fmpz *poly, slong len, ulong e, const fmpz_t p) { ulong bit = ~((~UWORD(0)) >> 1); slong rlen; slong alloc = (slong) e * (len - 1) + 1; fmpz *v = _fmpz_vec_init(alloc); fmpz *R, *S, *T; /* Set bits to the bitmask with a 1 one place lower than the msb of e */ while ((bit & e) == UWORD(0)) bit >>= 1; bit >>= 1; /* Trial run without any polynomial arithmetic to determine the parity of the number of swaps; then set R and S accordingly */ { unsigned int swaps = 0U; ulong bit2 = bit; if ((bit2 & e)) swaps = ~swaps; while (bit2 >>= 1) if ((bit2 & e) == UWORD(0)) swaps = ~swaps; if (swaps == 0U) { R = res; S = v; } else { R = v; S = res; } } /* We unroll the first step of the loop, referring to {poly, len} */ _fmpz_mod_poly_sqr(R, poly, len, p); rlen = 2 * len - 1; if ((bit & e)) { _fmpz_mod_poly_mul(S, R, rlen, poly, len, p); rlen += len - 1; T = R; R = S; S = T; } while ((bit >>= 1)) { if ((bit & e)) { _fmpz_mod_poly_sqr(S, R, rlen, p); rlen += rlen - 1; _fmpz_mod_poly_mul(R, S, rlen, poly, len, p); rlen += len - 1; } else { _fmpz_mod_poly_sqr(S, R, rlen, p); rlen += rlen - 1; T = R; R = S; S = T; } } _fmpz_vec_clear(v, alloc); } void fmpz_mod_poly_pow(fmpz_mod_poly_t rop, const fmpz_mod_poly_t op, ulong e, const fmpz_mod_ctx_t ctx) { const slong len = op->length; slong rlen; if ((len < 2) || (e < UWORD(3))) { if (e == UWORD(0)) fmpz_mod_poly_set_ui(rop, 1, ctx); else if (len == 0) fmpz_mod_poly_zero(rop, ctx); else if (len == 1) { fmpz_mod_poly_fit_length(rop, 1, ctx); fmpz_powm_ui(rop->coeffs, op->coeffs, e, fmpz_mod_ctx_modulus(ctx)); _fmpz_mod_poly_set_length(rop, 1); _fmpz_mod_poly_normalise(rop); } else if (e == UWORD(1)) fmpz_mod_poly_set(rop, op, ctx); else /* e == UWORD(2) */ fmpz_mod_poly_sqr(rop, op, ctx); return; } rlen = (slong) e * (len - 1) + 1; if (rop != op) { fmpz_mod_poly_fit_length(rop, rlen, ctx); _fmpz_mod_poly_pow(rop->coeffs, op->coeffs, len, e, fmpz_mod_ctx_modulus(ctx)); _fmpz_mod_poly_set_length(rop, rlen); } else { fmpz *t = _fmpz_vec_init(rlen); _fmpz_mod_poly_pow(t, op->coeffs, len, e, fmpz_mod_ctx_modulus(ctx)); _fmpz_vec_clear(rop->coeffs, rop->alloc); rop->coeffs = t; rop->alloc = rlen; rop->length = rlen; } _fmpz_mod_poly_normalise(rop); }