/* Copyright (C) 2016 Pascal Molin This file is part of Arb. Arb is free software: you can redistribute it and/or modify it under the terms of the GNU Lesser General Public License (LGPL) as published by the Free Software Foundation; either version 2.1 of the License, or (at your option) any later version. See . */ #ifndef ACB_DFT_H #define ACB_DFT_H #ifdef ACB_DFT_INLINES_C #define ACB_DFT_INLINE #else #define ACB_DFT_INLINE static __inline__ #endif #include "acb.h" #include "dlog.h" #ifdef __cplusplus extern "C" { #endif void _acb_dft_naive(acb_ptr w, acb_srcptr v, slong dv, acb_srcptr z, slong dz, slong len, slong prec); void acb_dft_naive(acb_ptr w, acb_srcptr v, slong len, slong prec); void acb_dft_crt(acb_ptr w, acb_srcptr v, slong len, slong prec); void acb_dft_cyc(acb_ptr w, acb_srcptr v, slong len, slong prec); void acb_dft_rad2_inplace(acb_ptr v, int e, slong prec); void acb_dft_rad2(acb_ptr w, acb_srcptr v, int e, slong prec); void acb_dft_bluestein(acb_ptr w, acb_srcptr v, slong len, slong prec); void acb_dft_prod(acb_ptr w, acb_srcptr v, slong * cyc, slong num, slong prec); void acb_dft_rad2_inplace_threaded(acb_ptr v, int e, slong prec); void acb_dft_convol_naive(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec); void acb_dft_convol_dft(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec); void acb_dft_convol_rad2(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec); void acb_dft_convol_mullow(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec); void acb_dft_convol(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec); #define CRT_MAX 15 typedef struct { int num; nmod_t n; slong m[CRT_MAX]; ulong M[CRT_MAX]; ulong vM[CRT_MAX]; } crt_struct; typedef crt_struct crt_t[1]; void crt_init(crt_t c, ulong n); void crt_decomp(acb_ptr y, acb_srcptr x, slong dx, const crt_t c, ulong len); void crt_recomp(acb_ptr y, acb_srcptr x, const crt_t c, ulong len); typedef struct acb_dft_step_struct acb_dft_step_struct; typedef acb_dft_step_struct * acb_dft_step_ptr; typedef struct { slong n; acb_ptr z; int zclear; slong num; acb_dft_step_ptr cyc; } acb_dft_cyc_struct; typedef acb_dft_cyc_struct acb_dft_cyc_t[1]; typedef struct { int e; slong n; /* = 1 << e */ slong dv; slong nz; /* = n but could be bigger */ acb_ptr z; } acb_dft_rad2_struct; typedef acb_dft_rad2_struct acb_dft_rad2_t[1]; typedef struct { slong n; slong dv; acb_ptr z; /* z[k] = e(k^2/2n) */ acb_ptr g; /* g[k] = dft( z ) */ acb_dft_rad2_t rad2; } acb_dft_bluestein_struct; typedef acb_dft_bluestein_struct acb_dft_bluestein_t[1]; typedef struct { slong n; slong num; acb_dft_step_ptr cyc; } acb_dft_prod_struct; typedef acb_dft_prod_struct acb_dft_prod_t[1]; typedef struct { slong n; crt_t c; slong dv; /* then a product */ acb_dft_step_ptr cyc; } acb_dft_crt_struct; typedef acb_dft_crt_struct acb_dft_crt_t[1]; typedef struct { slong n; slong dv; int zclear; acb_ptr z; slong dz; } acb_dft_naive_struct; typedef acb_dft_naive_struct acb_dft_naive_t[1]; typedef struct { slong n; int type; union { acb_dft_rad2_t rad2; acb_dft_cyc_t cyc; acb_dft_prod_t prod; acb_dft_crt_t crt; acb_dft_naive_t naive; acb_dft_bluestein_t bluestein; } t; } acb_dft_pre_struct; typedef acb_dft_pre_struct acb_dft_pre_t[1]; /* covers both product and cyclic case */ struct acb_dft_step_struct { /* [G:H] */ slong m; /* card H */ slong M; slong dv; /* = M for prod, also = M if cyc is reordered */ /* pointer on some roots of unity, if needed */ acb_srcptr z; /* index of mM in z */ slong dz; /* dft to call on H */ acb_dft_pre_t pre; /* dft to call on G/H ? */ }; /*typedef acb_dft_pre_struct acb_dft_pre_t[1];*/ #define DFT_VERB 0 enum { DFT_NAIVE, DFT_CYC, DFT_PROD, DFT_CRT , DFT_RAD2 , DFT_CONV }; void acb_dft_step(acb_ptr w, acb_srcptr v, acb_dft_step_ptr cyc, slong num, slong prec); void acb_dft_precomp(acb_ptr w, acb_srcptr v, const acb_dft_pre_t pre, slong prec); void acb_dft_inverse_precomp(acb_ptr w, acb_srcptr v, const acb_dft_pre_t pre, slong prec); void acb_dft_naive_precomp(acb_ptr w, acb_srcptr v, const acb_dft_naive_t pol, slong prec); void acb_dft_cyc_precomp(acb_ptr w, acb_srcptr v, const acb_dft_cyc_t cyc, slong prec); void acb_dft_rad2_precomp_inplace(acb_ptr v, const acb_dft_rad2_t rad2, slong prec); void acb_dft_rad2_precomp(acb_ptr w, acb_srcptr v, const acb_dft_rad2_t rad2, slong prec); void acb_dft_crt_precomp(acb_ptr w, acb_srcptr v, const acb_dft_crt_t crt, slong prec); void acb_dft_prod_precomp(acb_ptr w, acb_srcptr v, const acb_dft_prod_t prod, slong prec); void acb_dft_bluestein_precomp(acb_ptr w, acb_srcptr v, const acb_dft_bluestein_t t, slong prec); void acb_dft_rad2_precomp_inplace_threaded(acb_ptr v, const acb_dft_rad2_t rad2, slong prec); void acb_dft_inverse_rad2_precomp_inplace(acb_ptr v, const acb_dft_rad2_t rad2, slong prec); void acb_dft_inverse_rad2_precomp(acb_ptr w, acb_srcptr v, const acb_dft_rad2_t rad2, slong prec); void acb_dft_convol_rad2_precomp(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, const acb_dft_rad2_t, slong prec); void _acb_dft_precomp_init(acb_dft_pre_t pre, slong dv, acb_ptr z, slong dz, slong len, slong prec); void acb_dft_precomp_init(acb_dft_pre_t pre, slong len, slong prec); void acb_dft_precomp_clear(acb_dft_pre_t pre); void acb_dft(acb_ptr w, acb_srcptr v, slong len, slong prec); void acb_dft_inverse(acb_ptr w, acb_srcptr v, slong len, slong prec); acb_dft_step_ptr _acb_dft_steps_prod(slong * m, slong num, slong prec); ACB_DFT_INLINE void acb_dft_prod_init(acb_dft_prod_t t, slong * cyc, slong num, slong prec) { t->num = num; t->cyc = _acb_dft_steps_prod(cyc, num, prec); } void acb_dft_prod_clear(acb_dft_prod_t t); void _acb_dft_cyc_init_z_fac(acb_dft_cyc_t t, n_factor_t fac, slong dv, acb_ptr z, slong dz, slong len, slong prec); void _acb_dft_cyc_init(acb_dft_cyc_t t, slong dv, slong len, slong prec); ACB_DFT_INLINE void acb_dft_cyc_init(acb_dft_cyc_t t, slong len, slong prec) { _acb_dft_cyc_init(t, 1, len, prec); } void acb_dft_cyc_clear(acb_dft_cyc_t t); void _acb_dft_naive_init(acb_dft_naive_t pol, slong dv, acb_ptr z, slong dz, slong len, slong prec); ACB_DFT_INLINE void acb_dft_naive_init(acb_dft_naive_t pol, slong len, slong prec) { _acb_dft_naive_init(pol, 1, NULL, 0, len, prec); } ACB_DFT_INLINE void acb_dft_naive_clear(acb_dft_naive_t pol) { if (pol->zclear) _acb_vec_clear(pol->z, pol->n); } void _acb_dft_rad2_init(acb_dft_rad2_t t, slong dv, int e, slong prec); ACB_DFT_INLINE void acb_dft_rad2_init(acb_dft_rad2_t t, int e, slong prec) { _acb_dft_rad2_init(t, 1, e, prec); } ACB_DFT_INLINE void acb_dft_rad2_clear(acb_dft_rad2_t t) { _acb_vec_clear(t->z, t->nz); } void _acb_dft_bluestein_init(acb_dft_bluestein_t t, slong dv, slong n, slong prec); ACB_DFT_INLINE void acb_dft_bluestein_init(acb_dft_bluestein_t t, slong n, slong prec) { _acb_dft_bluestein_init(t, 1, n, prec); } ACB_DFT_INLINE void acb_dft_bluestein_clear(acb_dft_bluestein_t t) { if (t->n != 0) { _acb_vec_clear(t->z, t->n); _acb_vec_clear(t->g, t->rad2->n); acb_dft_rad2_clear(t->rad2); } } void _acb_dft_crt_init(acb_dft_crt_t crt, slong dv, slong len, slong prec); void acb_dft_crt_init(acb_dft_crt_t crt, slong len, slong prec); void acb_dft_crt_clear(acb_dft_crt_t crt); /* utils, could be moved elsewhere */ ACB_DFT_INLINE void acb_swap_ri(acb_t x) { arb_swap(acb_realref(x), acb_imagref(x)); } ACB_DFT_INLINE void acb_vec_swap_ri(acb_ptr v, slong len) { slong k; for (k = 0; k < len; k++) acb_swap_ri(v + k); } ACB_DFT_INLINE void _acb_vec_kronecker_mul(acb_ptr z, acb_srcptr x, acb_srcptr y, slong len, slong prec) { slong k; for (k = 0; k < len; k++) acb_mul(z + k, x + k, y + k, prec); } ACB_DFT_INLINE void _acb_vec_kronecker_mul_step(acb_ptr z, acb_srcptr x, acb_srcptr y, slong step, slong len, slong prec) { slong k; for (k = 0; k < len; k++) { acb_mul(z + k, x + k, y + k * step, prec); } } ACB_DFT_INLINE void acb_vec_printd_index(acb_srcptr vec, slong len, slong digits) { slong i; for (i = 0; i < len; i++) { flint_printf("[%wd] ", i); acb_printd(vec + i, digits); flint_printf("\n"); } } #ifdef __cplusplus } #endif #endif