/*
Copyright (C) 2008, 2009 William Hart
Copyright (C) 2010, 2012 Sebastian Pancratz
This file is part of FLINT.
FLINT is free software: you can redistribute it and/or modify it under
the terms of the GNU Lesser General Public License (LGPL) as published
by the Free Software Foundation; either version 2.1 of the License, or
(at your option) any later version. See <https://www.gnu.org/licenses/>.
*/
#include
#include
#include "flint.h"
#include "fmpz.h"
#include "fmpz_vec.h"
#include "fmpz_poly.h"
#include "fft.h"
/*
    Sets (res, len1 + len2 - 1) to the product of (poly1, len1) and
    (poly2, len2), computed by bit packing: every coefficient of each
    operand is packed into a field of `bits` bits inside one large integer,
    the two integers are multiplied, and the coefficients of the product
    are unpacked from the result.

    res    output vector; all len1 + len2 - 1 entries (using the lengths
           passed by the caller) are written
    poly1  first operand, len1 coefficients
    poly2  second operand, len2 coefficients

    The lengths are normalised internally with FMPZ_VEC_NORM, so the
    operands may be zero-padded; if either operand is zero after
    normalisation the output is simply zeroed.

    poly1 and poly2 may be the same pointer.  The single-pack squaring
    shortcut is only taken when the normalised lengths agree as well;
    the same pointer with different lengths denotes two different
    polynomials and goes through the general path.
*/
void
_fmpz_poly_mul_KS(fmpz * res, const fmpz * poly1, slong len1,
                  const fmpz * poly2, slong len2)
{
    /* Lengths as passed by the caller; len1 and len2 may shrink below. */
    const slong in1_len = len1, in2_len = len2;
    int neg1, neg2;
    int squaring;
    slong limbs1, limbs2, loglen;
    slong bits1, bits2, bits;
    mp_limb_t *arr1, *arr2, *arr3;
    slong sign = 0;

    FMPZ_VEC_NORM(poly1, len1);
    FMPZ_VEC_NORM(poly2, len2);

    if (!len1 | !len2)
    {
        if (in1_len + in2_len - 1 > 0)
            _fmpz_vec_zero(res, in1_len + in2_len - 1);

        return;
    }

    /*
        Pointer equality alone is not enough to treat the operands as the
        same polynomial: (poly, 3) and (poly, 2) share a pointer but differ.
        Sharing the packed buffer in that case would multiply the wrong
        operand and could read past the end of the buffer.
    */
    squaring = (poly1 == poly2 && len1 == len2);

    /* Negation flags (0 or -1) taken from the sign of the leading terms. */
    neg1 = (fmpz_sgn(poly1 + len1 - 1) > 0) ? 0 : -1;
    neg2 = (fmpz_sgn(poly2 + len2 - 1) > 0) ? 0 : -1;

    /* A negative return from _fmpz_vec_max_bits is handled as "signed". */
    bits1 = _fmpz_vec_max_bits(poly1, len1);
    if (bits1 < 0)
    {
        sign = 1;
        bits1 = -bits1;
    }

    if (squaring)
    {
        bits2 = bits1;
    }
    else
    {
        bits2 = _fmpz_vec_max_bits(poly2, len2);
        if (bits2 < 0)
        {
            sign = 1;
            bits2 = -bits2;
        }
    }

    /*
        Field width: a product coefficient is a sum of at most
        min(len1, len2) terms, each of at most bits1 + bits2 bits, plus
        one extra bit when signed coefficients are present.
    */
    loglen = FLINT_BIT_COUNT(FLINT_MIN(len1, len2));
    bits = bits1 + bits2 + loglen + sign;
    limbs1 = (bits * len1 - 1) / FLINT_BITS + 1;
    limbs2 = (bits * len2 - 1) / FLINT_BITS + 1;

    if (squaring)
    {
        /* limbs1 == limbs2 here, so one packed buffer serves both operands. */
        arr1 = (mp_limb_t *) flint_calloc(limbs1, sizeof(mp_limb_t));
        arr2 = arr1;
        _fmpz_poly_bit_pack(arr1, poly1, len1, bits, neg1);
    }
    else
    {
        /* One allocation holding both packed operands back to back. */
        arr1 = (mp_limb_t *) flint_calloc(limbs1 + limbs2, sizeof(mp_limb_t));
        arr2 = arr1 + limbs1;
        _fmpz_poly_bit_pack(arr1, poly1, len1, bits, neg1);
        _fmpz_poly_bit_pack(arr2, poly2, len2, bits, neg2);
    }

    arr3 = (mp_limb_t *) flint_malloc((limbs1 + limbs2) * sizeof(mp_limb_t));

    /*
        Multiply the packed integers.  The longer operand is always passed
        first; the hard-coded limb thresholds choose between the GMP mpn
        routines and flint_mpn_mul_fft_main.
    */
    if (limbs1 == limbs2)
    {
        if (limbs1 < 2000)
            mpn_mul_n(arr3, arr1, arr2, limbs1);
        else
            flint_mpn_mul_fft_main(arr3, arr1, limbs1, arr2, limbs2);
    }
    else if (limbs1 > limbs2)
    {
        if (limbs2 < 1000)
            mpn_mul(arr3, arr1, limbs1, arr2, limbs2);
        else
            flint_mpn_mul_fft_main(arr3, arr1, limbs1, arr2, limbs2);
    }
    else
    {
        if (limbs1 < 1000)
            mpn_mul(arr3, arr2, limbs2, arr1, limbs1);
        else
            flint_mpn_mul_fft_main(arr3, arr2, limbs2, arr1, limbs1);
    }

    /* neg1 ^ neg2 is nonzero exactly when one operand was packed negated. */
    if (sign)
        _fmpz_poly_bit_unpack(res, len1 + len2 - 1, arr3, bits, neg1 ^ neg2);
    else
        _fmpz_poly_bit_unpack_unsigned(res, len1 + len2 - 1, arr3, bits);

    /* Zero the output entries that correspond to the caller's zero padding. */
    if ((len1 < in1_len) | (len2 < in2_len))
        _fmpz_vec_zero(res + (len1 + len2 - 1),
                       (in1_len - len1) + (in2_len - len2));

    /* arr2 is either arr1 itself or points into arr1's allocation. */
    flint_free(arr1);
    flint_free(arr3);
}
/*
    Sets res to the product of poly1 and poly2 using _fmpz_poly_mul_KS.

    If either operand has length zero, res is set to zero.  Otherwise res
    is grown to hold len1 + len2 - 1 coefficients, the operands are handed
    to the underscore routine with the longer one first, and the length of
    res is set to len1 + len2 - 1.
*/
void
fmpz_poly_mul_KS(fmpz_poly_t res,
                 const fmpz_poly_t poly1, const fmpz_poly_t poly2)
{
    const slong n1 = poly1->length;
    const slong n2 = poly2->length;
    slong out_len;

    /* Zero operand: nothing to multiply. */
    if (n1 == 0 || n2 == 0)
    {
        fmpz_poly_zero(res);
        return;
    }

    out_len = n1 + n2 - 1;

    /*
        The coefficient pointers are read only after this call, inside the
        argument lists below.
    */
    fmpz_poly_fit_length(res, out_len);

    if (n2 > n1)
        _fmpz_poly_mul_KS(res->coeffs, poly2->coeffs, n2,
                          poly1->coeffs, n1);
    else
        _fmpz_poly_mul_KS(res->coeffs, poly1->coeffs, n1,
                          poly2->coeffs, n2);

    _fmpz_poly_set_length(res, out_len);
}