arb/acb_dft.h

330 lines
7.8 KiB
C
Raw Normal View History

/*
Copyright (C) 2016 Pascal Molin
This file is part of Arb.
Arb is free software: you can redistribute it and/or modify it under
the terms of the GNU Lesser General Public License (LGPL) as published
by the Free Software Foundation; either version 2.1 of the License, or
(at your option) any later version. See <http://www.gnu.org/licenses/>.
*/
#ifndef ACB_DFT_H
#define ACB_DFT_H
#ifdef ACB_DFT_INLINES_C
#define ACB_DFT_INLINE
#else
#define ACB_DFT_INLINE static __inline__
#endif
#include "acb.h"
#include "dlog.h"
#ifdef __cplusplus
extern "C" {
#endif
/* Stand-alone transforms: no precomputed scheme is passed in.
   In every prototype w is the writable result vector, v the read-only
   input and prec the working precision.
   NOTE(review): which algorithm each entry point uses is inferred from its
   name only; confirm against the implementation files. */

/* Strided kernel called by acb_dft_naive_precomp. z is a read-only vector
   supplied by the caller (presumably roots of unity -- TODO confirm);
   dv and dz accompany v and z respectively. */
void _acb_dft_naive(acb_ptr w, acb_srcptr v, slong dv, acb_srcptr z, slong dz, slong len, slong prec);
void acb_dft_naive(acb_ptr w, acb_srcptr v, slong len, slong prec);
void acb_dft_crt(acb_ptr w, acb_srcptr v, slong len, slong prec);
void acb_dft_cyc(acb_ptr w, acb_srcptr v, slong len, slong prec);
/* Takes a single writable vector, so presumably transforms v in place;
   e is presumably the base-2 logarithm of the length, as in
   acb_dft_rad2_init -- TODO confirm. */
void acb_dft_rad2(acb_ptr v, int e, slong prec);
void acb_dft_bluestein(acb_ptr w, acb_srcptr v, slong len, slong prec);
/* cyc is an array of num entries (presumably the sizes of the cyclic
   factors -- TODO confirm). */
void acb_dft_prod(acb_ptr w, acb_srcptr v, slong * cyc, slong num, slong prec);
/* Convolution helpers combining the read-only vectors f and g into w.
   NOTE(review): presumably a cyclic convolution of length len -- confirm. */
void acb_dft_convol_naive(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
void acb_dft_convol_rad2(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
/* Capacity of the fixed-size arrays in crt_struct. */
#define CRT_MAX 15
/* Data for an index decomposition, filled in by crt_init.
   NOTE(review): the meaning of n, M and vM is not visible in this header;
   confirm against the implementation of crt_init. */
typedef struct
{
/* number of entries of m that acb_dft_crt_init hands to _acb_dft_steps_prod */
int num;
nmod_t n;
/* array passed by acb_dft_crt_init to _acb_dft_steps_prod */
slong m[CRT_MAX];
ulong M[CRT_MAX];
ulong vM[CRT_MAX];
}
crt_struct;
/* One-element array type: a crt_t decays to a pointer when passed around. */
typedef crt_struct crt_t[1];
/* Fill c for the integer n. */
void crt_init(crt_t c, ulong n);
/* Reindexing helpers driven by c: both read x and write y.
   NOTE(review): presumably decomp permutes into the product ordering and
   recomp undoes it; dx presumably is the step between entries of x --
   confirm against the implementation. */
void crt_decomp(acb_ptr y, acb_srcptr x, slong dx, const crt_t c, ulong len);
void crt_recomp(acb_ptr y, acb_srcptr x, const crt_t c, ulong len);
/* Forward declaration: the step structure is defined further down, after
   acb_dft_pre_t, which it embeds. */
typedef struct acb_dft_step_struct acb_dft_step_struct;
typedef acb_dft_step_struct * acb_dft_step_ptr;
/* Precomputed data for the cyclic DFT scheme. */
typedef struct
{
slong n;
/* NOTE(review): presumably nonzero when z is owned and must be freed on
   clear, as in acb_dft_naive_clear -- confirm against acb_dft_cyc_clear */
int zclear;
acb_ptr z;
/* number of steps in cyc; passed with it to acb_dft_step by
   acb_dft_cyc_precomp */
slong num;
acb_dft_step_ptr cyc;
}
acb_dft_cyc_struct;
typedef acb_dft_cyc_struct acb_dft_cyc_t[1];
/* Precomputed data for the radix-2 DFT scheme (see acb_dft_rad2_init). */
typedef struct
{
int e;
slong n; /* = 1 << e */
/* acb_dft_rad2_init sets nz = n >> 1; z is allocated and freed with
   2 * nz entries */
slong nz;
acb_ptr z;
}
acb_dft_rad2_struct;
typedef acb_dft_rad2_struct acb_dft_rad2_t[1];
typedef struct
{
slong n;
2017-10-02 18:08:55 +02:00
acb_ptr z; /* z[k] = e(k^2/2n) */
acb_dft_rad2_t rad2;
}
acb_dft_bluestein_struct;
typedef acb_dft_bluestein_struct acb_dft_bluestein_t[1];
/* Precomputed data for a DFT over a product of cyclic factors. */
typedef struct
{
/* NOTE(review): not assigned by acb_dft_prod_init in this header */
slong n;
/* number of steps in cyc, as set by acb_dft_prod_init */
slong num;
/* step array returned by _acb_dft_steps_prod */
acb_dft_step_ptr cyc;
}
acb_dft_prod_struct;
typedef acb_dft_prod_struct acb_dft_prod_t[1];
/* Precomputed data for the CRT-based DFT scheme. */
typedef struct
{
/* transform length (acb_dft_crt_init stores len here) */
slong n;
/* decomposition data filled by crt_init */
crt_t c;
/* set to 1 by acb_dft_crt_init; _acb_dft_crt_init takes it as a parameter */
slong dv;
/* then a product */
/* step array built by _acb_dft_steps_prod from c->m and c->num */
acb_dft_step_ptr cyc;
}
acb_dft_crt_struct;
typedef acb_dft_crt_struct acb_dft_crt_t[1];
/* Precomputed data for the naive DFT.
   Stray blame timestamps that had ended up inside this declaration have
   been removed; the members themselves are unchanged. */
typedef struct
{
    slong n;    /* length passed to _acb_dft_naive; also the entry count used when z is freed */
    slong dv;   /* passed to _acb_dft_naive together with v */
    int zclear; /* nonzero: acb_dft_naive_clear frees z */
    acb_ptr z;  /* vector passed as z to _acb_dft_naive */
    slong dz;   /* passed to _acb_dft_naive together with z */
}
acb_dft_naive_struct;
typedef acb_dft_naive_struct acb_dft_naive_t[1];
/* Tagged union holding the precomputed data of one DFT scheme. */
typedef struct
{
/* selects the active member of t
   NOTE(review): presumably one of the DFT_* enum constants declared
   further down -- confirm against acb_dft_precomp_init */
int type;
union
{
acb_dft_rad2_t rad2;
acb_dft_cyc_t cyc;
acb_dft_prod_t prod;
acb_dft_crt_t crt;
acb_dft_naive_t naive;
acb_dft_bluestein_t bluestein;
} t;
}
acb_dft_pre_struct;
typedef acb_dft_pre_struct acb_dft_pre_t[1];
/* One step of a decomposed DFT; covers both product and cyclic case.
   Arrays of these are what acb_dft_step_ptr points to. The definition has
   to come after acb_dft_pre_t because a scheme is embedded by value. */
struct
acb_dft_step_struct
{
/* [G:H] */
slong m;
/* card H */
slong M;
slong dv; /* = M for prod, also = M if cyc is reordered */
/* pointer on some roots of unity, if needed */
acb_srcptr z;
/* index of mM in z */
slong dz;
/* dft to call on H */
acb_dft_pre_t pre;
/* dft to call on G/H ? */
};
/*typedef acb_dft_pre_struct acb_dft_pre_t[1];*/
/* NOTE(review): presumably a compile-time verbosity switch for debugging
   output; nothing in this header reads it -- confirm. */
#define DFT_VERB 0
/* Scheme identifiers.
   NOTE(review): presumably the values stored in acb_dft_pre_struct.type.
   The union there has a bluestein member but no constant is named after it;
   DFT_CONV presumably plays that role -- confirm. */
enum
{
DFT_NAIVE, DFT_CYC, DFT_PROD, DFT_CRT , DFT_RAD2 , DFT_CONV
};
/* Run the num steps stored in cyc on v, writing the result to w.
   Called by acb_dft_cyc_precomp with the steps of a cyclic scheme. */
void acb_dft_step(acb_ptr w, acb_srcptr v, acb_dft_step_ptr cyc, slong num, slong prec);
/* Apply the precomputed scheme pre to v, writing the result to w.
   NOTE(review): presumably dispatches on pre->type -- confirm. */
void acb_dft_precomp(acb_ptr w, acb_srcptr v, const acb_dft_pre_t pre, slong prec);
ACB_DFT_INLINE void
2017-10-02 14:22:50 +02:00
acb_dft_naive_precomp(acb_ptr w, acb_srcptr v, const acb_dft_naive_t pol, slong prec)
{
2017-10-02 14:22:50 +02:00
_acb_dft_naive(w, v, pol->dv, pol->z, pol->dz, pol->n, prec);
}
/* Apply the precomputed cyclic scheme cyc to v, writing the result to w.
   All the work is delegated to acb_dft_step on the stored step array. */
ACB_DFT_INLINE void
acb_dft_cyc_precomp(acb_ptr w, acb_srcptr v, const acb_dft_cyc_t cyc, slong prec)
{
    acb_dft_step_ptr steps = cyc->cyc;
    slong nsteps = cyc->num;

    acb_dft_step(w, v, steps, nsteps, prec);
}
/* Scheme-specific "apply" entry points; each takes the read-only
   precomputed data of its scheme. The rad2 variants take a single writable
   vector (presumably transformed in place -- TODO confirm). */
void acb_dft_rad2_precomp(acb_ptr v, const acb_dft_rad2_t rad2, slong prec);
void acb_dft_crt_precomp(acb_ptr w, acb_srcptr v, const acb_dft_crt_t crt, slong prec);
void acb_dft_prod_precomp(acb_ptr w, acb_srcptr v, const acb_dft_prod_t prod, slong prec);
void acb_dft_bluestein_precomp(acb_ptr w, acb_srcptr v, const acb_dft_bluestein_t t, slong prec);
void acb_dft_inverse_rad2_precomp(acb_ptr v, const acb_dft_rad2_t rad2, slong prec);
void acb_dft_convol_rad2_precomp(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, const acb_dft_rad2_t, slong prec);
/* Generic scheme set-up and tear-down. The underscore variant additionally
   takes dv, z and dz (same parameter names as in _acb_dft_naive_init).
   NOTE(review): how the scheme is chosen is not visible here. */
void _acb_dft_precomp_init(acb_dft_pre_t pre, slong dv, acb_ptr z, slong dz, slong len, slong prec);
void acb_dft_precomp_init(acb_dft_pre_t pre, slong len, slong prec);
void acb_dft_precomp_clear(acb_dft_pre_t pre);
/* Top-level transform of v into w.
   NOTE(review): presumably builds a scheme, applies it and clears it --
   confirm against the implementation. */
void acb_dft(acb_ptr w, acb_srcptr v, slong len, slong prec);
/* Returns a step array for the num entries of m; used by acb_dft_prod_init
   and acb_dft_crt_init, and released with flint_free in acb_dft_crt_clear. */
acb_dft_step_ptr _acb_dft_steps_prod(slong * m, slong num, slong prec);
/* Set up a product scheme from the num entries of cyc.
   Stores the step count and the step array built by _acb_dft_steps_prod;
   the n member of t is left untouched. */
ACB_DFT_INLINE void
acb_dft_prod_init(acb_dft_prod_t t, slong * cyc, slong num, slong prec)
{
    acb_dft_step_ptr steps = _acb_dft_steps_prod(cyc, num, prec);

    t->cyc = steps;
    t->num = num;
}
/* Release the data held by a product scheme. */
void acb_dft_prod_clear(acb_dft_prod_t t);
/* Cyclic scheme set-up. acb_dft_cyc_init calls _acb_dft_cyc_init with
   dv = 1; the _z_fac variant additionally takes a factorisation and a
   caller-supplied vector z with its dz.
   NOTE(review): whether z is then owned by t is not visible here. */
void _acb_dft_cyc_init_z_fac(acb_dft_cyc_t t, n_factor_t fac, slong dv, acb_ptr z, slong dz, slong len, slong prec);
void _acb_dft_cyc_init(acb_dft_cyc_t t, slong dv, slong len, slong prec);
/* Set up a cyclic scheme of length len: the dv = 1 case of
   _acb_dft_cyc_init. */
ACB_DFT_INLINE void
acb_dft_cyc_init(acb_dft_cyc_t t, slong len, slong prec)
{
    const slong dv = 1;

    _acb_dft_cyc_init(t, dv, len, prec);
}
void acb_dft_cyc_clear(acb_dft_cyc_t t);
2017-10-02 14:22:50 +02:00
void _acb_dft_naive_init(acb_dft_naive_t pol, slong dv, acb_ptr z, slong dz, slong len, slong prec);
ACB_DFT_INLINE void
2017-10-02 14:22:50 +02:00
acb_dft_naive_init(acb_dft_naive_t pol, slong len, slong prec)
{
2017-10-02 14:22:50 +02:00
_acb_dft_naive_init(pol, 1, NULL, 0, len, prec);
}
ACB_DFT_INLINE void
2017-10-02 14:22:50 +02:00
acb_dft_naive_clear(acb_dft_naive_t pol)
{
if (pol->zclear)
_acb_vec_clear(pol->z, pol->n);
}
/* Set up a radix-2 scheme of length n = 2^e at precision prec.
   Stores e, n and nz = n / 2, allocates 2 * nz entries for z and fills them
   through _acb_vec_unit_roots; release with acb_dft_rad2_clear.
   NOTE(review): for e = 0 the buffer has 2 * nz = 0 entries while
   _acb_vec_unit_roots is still called with n = 1 -- confirm that it writes
   nothing in that case. */
ACB_DFT_INLINE void
acb_dft_rad2_init(acb_dft_rad2_t t, int e, slong prec)
{
    t->e = e;
    /* shift in slong rather than int: n is an slong, and "1 << e" is
       undefined as soon as e reaches the width of int */
    t->n = (slong) 1 << e;
    t->nz = t->n >> 1;
    t->z = _acb_vec_init(2 * t->nz);
    /* set n/2 roots of order n */
    /* xxx: don't compute twice the number */
    _acb_vec_unit_roots(t->z, t->n, prec);
}
/* Release the vector of a radix-2 scheme; it holds 2 * nz entries, the
   count used when acb_dft_rad2_init allocated it. */
ACB_DFT_INLINE void
acb_dft_rad2_clear(acb_dft_rad2_t t)
{
    const slong zlen = 2 * t->nz;

    _acb_vec_clear(t->z, zlen);
}
/* Set up a Bluestein scheme for length n; release it with
   acb_dft_bluestein_clear, which frees n entries of z and the embedded
   rad2 scheme. */
void acb_dft_bluestein_init(acb_dft_bluestein_t t, slong n, slong prec);
/* Release a Bluestein scheme: first its n-entry vector z, then the
   embedded radix-2 scheme. */
ACB_DFT_INLINE void
acb_dft_bluestein_clear(acb_dft_bluestein_t t)
{
    const slong zlen = t->n;

    _acb_vec_clear(t->z, zlen);
    acb_dft_rad2_clear(t->rad2);
}
/* CRT scheme set-up taking an explicit dv.
   NOTE(review): presumably identical to acb_dft_crt_init except that dv is
   stored instead of 1 -- confirm against the implementation. */
void _acb_dft_crt_init(acb_dft_crt_t crt, slong dv, slong len, slong prec);
/* Set up a CRT scheme of length len with dv = 1.
   The decomposition data is filled by crt_init, and the step array is then
   built by _acb_dft_steps_prod from its m array and num count. */
ACB_DFT_INLINE void
acb_dft_crt_init(acb_dft_crt_t crt, slong len, slong prec)
{
    crt_struct * dec = crt->c;

    crt->dv = 1;
    crt->n = len;
    crt_init(dec, len);
    crt->cyc = _acb_dft_steps_prod(dec->m, dec->num, prec);
}
/* Release a CRT scheme.
   The step array holds c->num entries (the count given to
   _acb_dft_steps_prod at init), and every step embeds its own acb_dft_pre_t.
   Freeing only the array would leak whatever those sub-schemes own, so each
   one is cleared first.
   NOTE(review): relies on _acb_dft_steps_prod having initialised the pre
   member of every step -- confirm against its implementation. */
ACB_DFT_INLINE void
acb_dft_crt_clear(acb_dft_crt_t crt)
{
    slong i;

    for (i = 0; i < crt->c->num; i++)
    {
        acb_dft_precomp_clear(crt->cyc[i].pre);
    }
    flint_free(crt->cyc);
}
/* utils, could be moved elsewhere */
/* Exchange the real and imaginary parts of x in place. */
ACB_DFT_INLINE void
acb_swap_ri(acb_t x)
{
    arb_swap(acb_imagref(x), acb_realref(x));
}
/* Exchange real and imaginary parts of each of the first len entries of v,
   in place. Does nothing when len <= 0. */
ACB_DFT_INLINE void
acb_vec_swap_ri(acb_ptr v, slong len)
{
    slong i = 0;

    while (i < len)
    {
        acb_swap_ri(v + i);
        i++;
    }
}
/* Entrywise product: z[i] = x[i] * y[i] for 0 <= i < len, computed at
   precision prec in increasing index order. */
ACB_DFT_INLINE void
_acb_vec_kronecker_mul(acb_ptr z, acb_srcptr x, acb_srcptr y, slong len, slong prec)
{
    slong i = 0;

    while (i < len)
    {
        acb_mul(z + i, x + i, y + i, prec);
        i++;
    }
}
2017-10-05 13:37:35 +02:00
/* FIXME: no longer used */
/* z[k] = conj(x[k])*y[k] */
ACB_DFT_INLINE void
acb_vec_kronecker_mul_conj(acb_ptr z, acb_srcptr x, acb_srcptr y, slong len, slong prec)
{
slong k;
for (k = 0; k < len; k++)
{
acb_conj(z + k, x + k);
acb_mul(z + k, z + k, y + k, prec);
}
}
/* Debug helper: print the first len entries of vec, one per line, as
   "[index] value", each value printed by acb_printd with the given number
   of digits. */
ACB_DFT_INLINE void
acb_vec_printd_index(acb_srcptr vec, slong len, slong digits)
{
    slong i;

    for (i = 0; i < len; i++)
    {
        /* %wd is flint_printf's conversion for slong; %ld is only correct
           on platforms where slong happens to be long */
        flint_printf("[%wd] ", i);
        acb_printd(vec + i, digits);
        flint_printf("\n");
    }
}
#ifdef __cplusplus
}
#endif
#endif