/* Copyright (C) 2010 William Hart Copyright (C) 2010 Sebastian Pancratz This file is part of FLINT. FLINT is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License (LGPL) as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. See . */ #include #include #include "flint.h" #include "nmod_vec.h" #include "nmod_poly.h" void _nmod_poly_mul_KS(mp_ptr out, mp_srcptr in1, slong len1, mp_srcptr in2, slong len2, flint_bitcnt_t bits, nmod_t mod) { slong len_out = len1 + len2 - 1, limbs1, limbs2; mp_ptr tmp, mpn1, mpn2, res; int squaring; TMP_INIT; squaring = (in1 == in2 && len1 == len2); if (bits == 0) { flint_bitcnt_t bits1, bits2, loglen; /* Look at the actual bits of the input? This slows down the generic case. Are there situations where we care enough about special input? */ #if 0 bits1 = _nmod_vec_max_bits2(in1, len1); bits2 = squaring ? bits1 : _nmod_vec_max_bits2(in2, len2); #else bits1 = FLINT_BITS - (slong) mod.norm; bits2 = bits1; #endif loglen = FLINT_BIT_COUNT(len2); bits = bits1 + bits2 + loglen; } limbs1 = (len1 * bits - 1) / FLINT_BITS + 1; limbs2 = (len2 * bits - 1) / FLINT_BITS + 1; TMP_START; tmp = TMP_ALLOC(sizeof(mp_limb_t) * (limbs1 + limbs2 + limbs1 + (squaring ? 0 : limbs2))); res = tmp; mpn1 = tmp + limbs1 + limbs2; mpn2 = squaring ? mpn1 : (mpn1 + limbs1); _nmod_poly_bit_pack(mpn1, in1, len1, bits); if (!squaring) _nmod_poly_bit_pack(mpn2, in2, len2, bits); if (squaring) mpn_sqr(res, mpn1, limbs1); else mpn_mul(res, mpn1, limbs1, mpn2, limbs2); _nmod_poly_bit_unpack(out, len_out, res, bits, mod); TMP_END; } void nmod_poly_mul_KS(nmod_poly_t res, const nmod_poly_t poly1, const nmod_poly_t poly2, flint_bitcnt_t bits) { slong len_out; if ((poly1->length == 0) || (poly2->length == 0)) { nmod_poly_zero(res); return; } len_out = poly1->length + poly2->length - 1; if (res == poly1 || res == poly2) { nmod_poly_t temp; nmod_poly_init2_preinv(temp, poly1->mod.n, poly1->mod.ninv, len_out); if (poly1->length >= poly2->length) _nmod_poly_mul_KS(temp->coeffs, poly1->coeffs, poly1->length, poly2->coeffs, poly2->length, bits, poly1->mod); else _nmod_poly_mul_KS(temp->coeffs, poly2->coeffs, poly2->length, poly1->coeffs, poly1->length, bits, poly1->mod); nmod_poly_swap(res, temp); nmod_poly_clear(temp); } else { nmod_poly_fit_length(res, len_out); if (poly1->length >= poly2->length) _nmod_poly_mul_KS(res->coeffs, poly1->coeffs, poly1->length, poly2->coeffs, poly2->length, bits, poly1->mod); else _nmod_poly_mul_KS(res->coeffs, poly2->coeffs, poly2->length, poly1->coeffs, poly1->length, bits, poly1->mod); } res->length = len_out; _nmod_poly_normalise(res); }