/* Copyright (C) 2008, 2009, 2011 William Hart Copyright (C) 2011 Sebastian Pancratz Copyright (C) 2012 Fredrik Johansson This file is part of FLINT. FLINT is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License (LGPL) as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. See . */ #include #include #include "flint.h" #include "nmod_vec.h" #include "nmod_poly.h" static void __nmod_poly_divrem_divconquer(mp_ptr Q, mp_ptr R, mp_srcptr A, slong lenA, mp_srcptr B, slong lenB, nmod_t mod) { if (lenA < 2 * lenB - 1) { /* Convert unbalanced division into a 2 n1 - 1 by n1 division */ const slong n1 = lenA - lenB + 1; const slong n2 = lenB - n1; mp_srcptr p1 = A + n2; mp_srcptr d1 = B + n2; mp_srcptr d2 = B; mp_ptr V = _nmod_vec_init((n1 - 1) + lenB - 1 + NMOD_DIVREM_DC_ITCH(n1, mod)); mp_ptr W = V + NMOD_DIVREM_DC_ITCH(n1, mod); mp_ptr d1q1 = R + n2; mp_ptr d2q1 = W; _nmod_poly_divrem_divconquer_recursive(Q, d1q1, W, V, p1, d1, n1, mod); /* Compute d2q1 = Q d2, of length lenB - 1 */ if (n1 >= n2) _nmod_poly_mul(d2q1, Q, n1, d2, n2, mod); else _nmod_poly_mul(d2q1, d2, n2, Q, n1, mod); /* Compute BQ = d1q1 * x^n1 + d2q1, of length lenB - 1; then compute R = A - BQ */ flint_mpn_copyi(R, d2q1, n2); _nmod_vec_add(R + n2, R + n2, d2q1 + n2, n1 - 1, mod); _nmod_vec_sub(R, A, R, lenB - 1, mod); _nmod_vec_clear(V); } else /* lenA = 2 * lenB - 1 */ { mp_ptr V = _nmod_vec_init(lenB - 1 + NMOD_DIVREM_DC_ITCH(lenB, mod)); mp_ptr W = V + NMOD_DIVREM_DC_ITCH(lenB, mod); _nmod_poly_divrem_divconquer_recursive(Q, R, W, V, A, B, lenB, mod); _nmod_vec_sub(R, A, R, lenB - 1, mod); _nmod_vec_clear(V); } } void _nmod_poly_divrem_divconquer(mp_ptr Q, mp_ptr R, mp_srcptr A, slong lenA, mp_srcptr B, slong lenB, nmod_t mod) { if (lenA <= 2 * lenB - 1) { __nmod_poly_divrem_divconquer(Q, R, A, lenA, B, lenB, mod); } else /* lenA > 2 * lenB - 1 */ { slong shift, n = 2 * lenB - 1; mp_ptr S, QB, W, V, T; S = _nmod_vec_init(lenA + 2 * (lenB - 1) + n + NMOD_DIVREM_DC_ITCH(lenB, mod)); QB = S + lenA; W = QB + (lenB - 1); T = W + (lenB - 1); V = T + n; _nmod_vec_set(S, A, lenA); while (lenA >= n) { shift = lenA - n; _nmod_poly_divrem_divconquer_recursive(Q + shift, QB, W, V, S + shift, B, lenB, mod); _nmod_vec_sub(S + shift, S + shift, QB, lenB - 1, mod); lenA -= lenB; } if (lenA >= lenB) { __nmod_poly_divrem_divconquer(Q, T, S, lenA, B, lenB, mod); _nmod_vec_set(S, T, lenA); } _nmod_vec_set(R, S, lenB - 1); _nmod_vec_clear(S); } } void nmod_poly_divrem_divconquer(nmod_poly_t Q, nmod_poly_t R, const nmod_poly_t A, const nmod_poly_t B) { nmod_poly_t tQ, tR; mp_ptr q, r; slong lenA, lenB; lenA = A->length; lenB = B->length; if (lenB == 0) { if (nmod_poly_modulus(B) == 1) { nmod_poly_set(Q, A); nmod_poly_zero(R); return; } else { flint_printf("Exception (nmod_poly_divrem_divconquer). Division by zero.\n"); flint_abort(); } } if (lenA < lenB) { nmod_poly_set(R, A); nmod_poly_zero(Q); return; } if (Q == A || Q == B) { nmod_poly_init2(tQ, A->mod.n, lenA - lenB + 1); q = tQ->coeffs; } else { nmod_poly_fit_length(Q, lenA - lenB + 1); q = Q->coeffs; } if (R == A || R == B) { nmod_poly_init2(tR, A->mod.n, lenB - 1); r = tR->coeffs; } else { nmod_poly_fit_length(R, lenB - 1); r = R->coeffs; } _nmod_poly_divrem_divconquer(q, r, A->coeffs, lenA, B->coeffs, lenB, A->mod); if (Q == A || Q == B) { nmod_poly_swap(tQ, Q); nmod_poly_clear(tQ); } if (R == A || R == B) { nmod_poly_swap(tR, R); nmod_poly_clear(tR); } Q->length = lenA - lenB + 1; R->length = lenB - 1; _nmod_poly_normalise(R); }