/*
Copyright (C) 2009, 2011 William Hart
This file is part of FLINT.
FLINT is free software: you can redistribute it and/or modify it under
the terms of the GNU Lesser General Public License (LGPL) as published
by the Free Software Foundation; either version 2.1 of the License, or
(at your option) any later version. See <https://www.gnu.org/licenses/>.
*/
#include
#include
#include
#include "flint.h"
#include "ulong_extras.h"
#include "mpn_extras.h"
#include "fft.h"
/*
   Set p = 2^(n*w) + 1.

   The value is built by starting from 1, shifting it left by n*w bits
   and then adding 1.
*/
void set_p(mpz_t p, mp_size_t n, flint_bitcnt_t w)
{
    flint_bitcnt_t shift = n*w;

    flint_mpz_set_ui(p, 1);
    mpz_mul_2exp(p, p, shift);
    flint_mpz_add_ui(p, p, 1);
}
/*
   Reference forward butterfly computed with mpz arithmetic.

   With B = limbs*FLINT_BITS, on return

       s = (i1 + i2) mod p
       t = (i1 - i2) * 2^(i*(w/2) + i/2) * (2^(3*B/4) - 2^(B/4)) mod p

   When p = 2^B + 1 the factor 2^(3*B/4) - 2^(B/4) squares to 2 modulo p.
   The inputs i1 and i2 are only read; s is used as scratch space before
   it receives its final value.
*/
void ref_fft_butterfly_sqrt2(mpz_t s, mpz_t t, mpz_t i1, mpz_t i2,
                      mpz_t p, mp_size_t i, mp_size_t limbs, mp_size_t w)
{
    const mp_size_t twist_shift = i*(w/2) + i/2;
    const mp_size_t high_shift = 3*limbs*FLINT_BITS/4;
    const mp_size_t low_shift = limbs*FLINT_BITS/4;

    /* t = (i1 - i2) * 2^twist_shift */
    mpz_sub(t, i1, i2);
    mpz_mul_2exp(t, t, twist_shift);

    /* t = t * (2^high_shift - 2^low_shift), with s holding the high term */
    mpz_mul_2exp(s, t, high_shift);
    mpz_mul_2exp(t, t, low_shift);
    mpz_sub(t, s, t);

    /* s is free again: form the sum and reduce both outputs */
    mpz_add(s, i1, i2);
    mpz_mod(s, s, p);
    mpz_mod(t, t, p);
}
/*
   Reference inverse butterfly computed with mpz arithmetic.

   With B = limbs*FLINT_BITS and

       x = i2 * 2^(2*n*w - i*(w/2) - 1 - i/2) * (2^(3*B/4) - 2^(B/4))

   on return

       s = (i1 + x) mod p
       t = (i1 - x) mod p

   When p = 2^(n*w) + 1 (as built by set_p in this file), 2^(2*n*w) is
   congruent to 1 modulo p, so the shift by 2*n*w - e acts as a division
   by 2^e.

   The inputs i1 and i2 are only read: the twisted term x is accumulated
   in t (s is scratch), so the caller's i2 is left untouched.
*/
void ref_ifft_butterfly_sqrt2(mpz_t s, mpz_t t, mpz_t i1, mpz_t i2,
           mpz_t p, mp_size_t i, mp_size_t n, mp_size_t limbs, mp_size_t w)
{
    const mp_size_t twist_shift = 2*n*w - i*(w/2) - 1 - i/2;
    const mp_size_t high_shift = 3*limbs*FLINT_BITS/4;
    const mp_size_t low_shift = limbs*FLINT_BITS/4;

    /* s = i2 * 2^twist_shift */
    mpz_mul_2exp(s, i2, twist_shift);

    /* t = x = s * (2^high_shift - 2^low_shift) */
    mpz_mul_2exp(t, s, high_shift);
    mpz_mul_2exp(s, s, low_shift);
    mpz_sub(t, t, s);

    /* GMP permits an output operand to alias an input, so t can be
       consumed and overwritten in the same call */
    mpz_add(s, i1, t);
    mpz_sub(t, i1, t);

    mpz_mod(s, s, p);
    mpz_mod(t, t, p);
}
int
main(void)
{
mp_size_t c, bits, j, k, n, w, limbs;
mpz_t p, ma, mb, m2a, m2b, mn1, mn2;
mp_limb_t * nn1, * nn2, * r1, * r2, * temp;
FLINT_TEST_INIT(state);
flint_printf("fft/ifft_butterfly_sqrt2....");
fflush(stdout);
_flint_rand_init_gmp(state);
mpz_init(p);
mpz_init(ma);
mpz_init(mb);
mpz_init(m2a);
mpz_init(m2b);
mpz_init(mn1);
mpz_init(mn2);
for (bits = FLINT_BITS; bits < 20*FLINT_BITS; bits += FLINT_BITS)
{
for (j = 1; j < 10; j++)
{
for (k = 1; k <= FLINT_BITS; k <<= 1)
{
n = bits/k;
w = j*k;
if ((w & 1) == 0) continue; /* w must be odd here */
limbs = (n*w)/FLINT_BITS;
for (c = 1; c < 2*n; c+=2)
{
nn1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
nn2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
temp = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
random_fermat(nn1, state, limbs);
random_fermat(nn2, state, limbs);
fermat_to_mpz(mn1, nn1, limbs);
fermat_to_mpz(mn2, nn2, limbs);
set_p(p, n, w);
fft_butterfly_sqrt2(r1, r2, nn1, nn2, c, limbs, w, temp);
fermat_to_mpz(m2a, r1, limbs);
fermat_to_mpz(m2b, r2, limbs);
mpz_mod(m2a, m2a, p);
mpz_mod(m2b, m2b, p);
ref_fft_butterfly_sqrt2(ma, mb, mn1, mn2, p, c, limbs, w);
if (mpz_cmp(ma, m2a) != 0)
{
flint_printf("FAIL:\n");
flint_printf("fft_butterfly_sqrt2 error a\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", ma);
gmp_printf("got %Zx\n", m2a);
abort();
}
if (mpz_cmp(mb, m2b) != 0)
{
flint_printf("FAIL:\n");
flint_printf("fft_butterfly_sqrt2 error b\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", mb);
gmp_printf("got %Zx\n", m2b);
abort();
}
flint_free(temp);
flint_free(nn1);
flint_free(nn2);
flint_free(r1);
flint_free(r2);
}
}
}
}
for (bits = FLINT_BITS; bits < 20*FLINT_BITS; bits += FLINT_BITS)
{
for (j = 1; j < 10; j++)
{
for (k = 1; k <= FLINT_BITS; k <<= 1)
{
n = bits/k;
w = j*k;
if ((w & 1) == 0) continue; /* w must be odd here */
limbs = (n*w)/FLINT_BITS;
for (c = 1; c < 2*n; c+=2)
{
nn1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
nn2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
temp = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r1 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
r2 = flint_malloc((limbs + 1)*sizeof(mp_limb_t));
random_fermat(nn1, state, limbs);
random_fermat(nn2, state, limbs);
fermat_to_mpz(mn1, nn1, limbs);
fermat_to_mpz(mn2, nn2, limbs);
set_p(p, n, w);
ifft_butterfly_sqrt2(r1, r2, nn1, nn2, c, limbs, w, temp);
fermat_to_mpz(m2a, r1, limbs);
fermat_to_mpz(m2b, r2, limbs);
mpz_mod(m2a, m2a, p);
mpz_mod(m2b, m2b, p);
ref_ifft_butterfly_sqrt2(ma, mb, mn1, mn2, p, c, n, limbs, w);
if (mpz_cmp(ma, m2a) != 0)
{
flint_printf("FAIL:\n");
flint_printf("ifft_butterfly_sqrt2 error a\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", ma);
gmp_printf("got %Zx\n", m2a);
abort();
}
if (mpz_cmp(mb, m2b) != 0)
{
flint_printf("FAIL:\n");
flint_printf("ifft_butterfly_sqrt2 error b\n");
flint_printf("limbs = %wd\n", limbs);
flint_printf("n = %wd, w = %wd, k = %wd, c = %wd\n", n, w, k, c);
gmp_printf("want %Zx\n\n", mb);
gmp_printf("got %Zx\n", m2b);
abort();
}
flint_free(temp);
flint_free(nn1);
flint_free(nn2);
flint_free(r1);
flint_free(r2);
}
}
}
}
mpz_clear(p);
mpz_clear(ma);
mpz_clear(mb);
mpz_clear(m2a);
mpz_clear(m2b);
mpz_clear(mn1);
mpz_clear(mn2);
FLINT_TEST_CLEANUP(state);
flint_printf("PASS\n");
return 0;
}