mirror of
https://github.com/vale981/arb
synced 2025-03-04 17:01:40 -05:00
331 lines
8.4 KiB
C
331 lines
8.4 KiB
C
/*
|
|
Copyright (C) 2016 Pascal Molin
|
|
|
|
This file is part of Arb.
|
|
|
|
Arb is free software: you can redistribute it and/or modify it under
|
|
the terms of the GNU Lesser General Public License (LGPL) as published
|
|
by the Free Software Foundation; either version 2.1 of the License, or
|
|
(at your option) any later version. See <http://www.gnu.org/licenses/>.
|
|
*/
|
|
|
|
#ifndef ACB_DFT_H
|
|
#define ACB_DFT_H
|
|
|
|
#ifdef ACB_DFT_INLINES_C
|
|
#define ACB_DFT_INLINE
|
|
#else
|
|
#define ACB_DFT_INLINE static __inline__
|
|
#endif
|
|
|
|
#include "acb.h"
|
|
#include "dlog.h"
|
|
|
|
#ifdef __cplusplus
|
|
extern "C" {
|
|
#endif
|
|
|
|
void _acb_dft_naive(acb_ptr w, acb_srcptr v, slong dv, acb_srcptr z, slong dz, slong len, slong prec);
|
|
void acb_dft_naive(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
void acb_dft_crt(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
void acb_dft_cyc(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
void acb_dft_rad2_inplace(acb_ptr v, int e, slong prec);
|
|
void acb_dft_rad2(acb_ptr w, acb_srcptr v, int e, slong prec);
|
|
void acb_dft_bluestein(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
void acb_dft_prod(acb_ptr w, acb_srcptr v, slong * cyc, slong num, slong prec);
|
|
|
|
void acb_dft_rad2_inplace_threaded(acb_ptr v, int e, slong prec);
|
|
|
|
void acb_dft_convol_naive(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
|
|
void acb_dft_convol_dft(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
|
|
void acb_dft_convol_rad2(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
|
|
void acb_dft_convol_mullow(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
|
|
void acb_dft_convol(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, slong prec);
|
|
|
|
#define CRT_MAX 15
|
|
typedef struct
|
|
{
|
|
int num;
|
|
nmod_t n;
|
|
slong m[CRT_MAX];
|
|
ulong M[CRT_MAX];
|
|
ulong vM[CRT_MAX];
|
|
}
|
|
crt_struct;
|
|
|
|
typedef crt_struct crt_t[1];
|
|
|
|
void crt_init(crt_t c, ulong n);
|
|
|
|
void crt_decomp(acb_ptr y, acb_srcptr x, slong dx, const crt_t c, ulong len);
|
|
void crt_recomp(acb_ptr y, acb_srcptr x, const crt_t c, ulong len);
|
|
|
|
typedef struct acb_dft_step_struct acb_dft_step_struct;
|
|
typedef acb_dft_step_struct * acb_dft_step_ptr;
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
acb_ptr z;
|
|
int zclear;
|
|
slong num;
|
|
acb_dft_step_ptr cyc;
|
|
}
|
|
acb_dft_cyc_struct;
|
|
|
|
typedef acb_dft_cyc_struct acb_dft_cyc_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
int e;
|
|
slong n; /* = 1 << e */
|
|
slong dv;
|
|
slong nz; /* = n but could be bigger */
|
|
acb_ptr z;
|
|
}
|
|
acb_dft_rad2_struct;
|
|
|
|
typedef acb_dft_rad2_struct acb_dft_rad2_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
slong dv;
|
|
acb_ptr z; /* z[k] = e(k^2/2n) */
|
|
acb_ptr g; /* g[k] = dft( z ) */
|
|
acb_dft_rad2_t rad2;
|
|
}
|
|
acb_dft_bluestein_struct;
|
|
|
|
typedef acb_dft_bluestein_struct acb_dft_bluestein_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
slong num;
|
|
acb_dft_step_ptr cyc;
|
|
}
|
|
acb_dft_prod_struct;
|
|
|
|
typedef acb_dft_prod_struct acb_dft_prod_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
crt_t c;
|
|
slong dv;
|
|
/* then a product */
|
|
acb_dft_step_ptr cyc;
|
|
}
|
|
acb_dft_crt_struct;
|
|
|
|
typedef acb_dft_crt_struct acb_dft_crt_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
slong dv;
|
|
int zclear;
|
|
acb_ptr z;
|
|
slong dz;
|
|
}
|
|
acb_dft_naive_struct;
|
|
|
|
typedef acb_dft_naive_struct acb_dft_naive_t[1];
|
|
|
|
typedef struct
|
|
{
|
|
slong n;
|
|
int type;
|
|
union
|
|
{
|
|
acb_dft_rad2_t rad2;
|
|
acb_dft_cyc_t cyc;
|
|
acb_dft_prod_t prod;
|
|
acb_dft_crt_t crt;
|
|
acb_dft_naive_t naive;
|
|
acb_dft_bluestein_t bluestein;
|
|
} t;
|
|
}
|
|
acb_dft_pre_struct;
|
|
|
|
typedef acb_dft_pre_struct acb_dft_pre_t[1];
|
|
|
|
/* covers both product and cyclic case */
|
|
struct
|
|
acb_dft_step_struct
|
|
{
|
|
/* [G:H] */
|
|
slong m;
|
|
/* card H */
|
|
slong M;
|
|
slong dv; /* = M for prod, also = M if cyc is reordered */
|
|
/* pointer on some roots of unity, if needed */
|
|
acb_srcptr z;
|
|
/* index of mM in z */
|
|
slong dz;
|
|
/* dft to call on H */
|
|
acb_dft_pre_t pre;
|
|
/* dft to call on G/H ? */
|
|
};
|
|
|
|
/*typedef acb_dft_pre_struct acb_dft_pre_t[1];*/
|
|
|
|
#define DFT_VERB 0
|
|
|
|
enum
|
|
{
|
|
DFT_NAIVE, DFT_CYC, DFT_PROD, DFT_CRT , DFT_RAD2 , DFT_CONV
|
|
};
|
|
|
|
void acb_dft_step(acb_ptr w, acb_srcptr v, acb_dft_step_ptr cyc, slong num, slong prec);
|
|
|
|
void acb_dft_precomp(acb_ptr w, acb_srcptr v, const acb_dft_pre_t pre, slong prec);
|
|
void acb_dft_inverse_precomp(acb_ptr w, acb_srcptr v, const acb_dft_pre_t pre, slong prec);
|
|
void acb_dft_naive_precomp(acb_ptr w, acb_srcptr v, const acb_dft_naive_t pol, slong prec);
|
|
void acb_dft_cyc_precomp(acb_ptr w, acb_srcptr v, const acb_dft_cyc_t cyc, slong prec);
|
|
|
|
void acb_dft_rad2_precomp_inplace(acb_ptr v, const acb_dft_rad2_t rad2, slong prec);
|
|
void acb_dft_rad2_precomp(acb_ptr w, acb_srcptr v, const acb_dft_rad2_t rad2, slong prec);
|
|
void acb_dft_crt_precomp(acb_ptr w, acb_srcptr v, const acb_dft_crt_t crt, slong prec);
|
|
void acb_dft_prod_precomp(acb_ptr w, acb_srcptr v, const acb_dft_prod_t prod, slong prec);
|
|
void acb_dft_bluestein_precomp(acb_ptr w, acb_srcptr v, const acb_dft_bluestein_t t, slong prec);
|
|
|
|
void acb_dft_rad2_precomp_inplace_threaded(acb_ptr v, const acb_dft_rad2_t rad2, slong prec);
|
|
|
|
void acb_dft_inverse_rad2_precomp_inplace(acb_ptr v, const acb_dft_rad2_t rad2, slong prec);
|
|
void acb_dft_inverse_rad2_precomp(acb_ptr w, acb_srcptr v, const acb_dft_rad2_t rad2, slong prec);
|
|
void acb_dft_convol_rad2_precomp(acb_ptr w, acb_srcptr f, acb_srcptr g, slong len, const acb_dft_rad2_t, slong prec);
|
|
|
|
void _acb_dft_precomp_init(acb_dft_pre_t pre, slong dv, acb_ptr z, slong dz, slong len, slong prec);
|
|
void acb_dft_precomp_init(acb_dft_pre_t pre, slong len, slong prec);
|
|
void acb_dft_precomp_clear(acb_dft_pre_t pre);
|
|
|
|
void acb_dft(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
void acb_dft_inverse(acb_ptr w, acb_srcptr v, slong len, slong prec);
|
|
|
|
acb_dft_step_ptr _acb_dft_steps_prod(slong * m, slong num, slong prec);
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_prod_init(acb_dft_prod_t t, slong * cyc, slong num, slong prec)
|
|
{
|
|
t->num = num;
|
|
t->cyc = _acb_dft_steps_prod(cyc, num, prec);
|
|
}
|
|
|
|
void acb_dft_prod_clear(acb_dft_prod_t t);
|
|
|
|
void _acb_dft_cyc_init_z_fac(acb_dft_cyc_t t, n_factor_t fac, slong dv, acb_ptr z, slong dz, slong len, slong prec);
|
|
void _acb_dft_cyc_init(acb_dft_cyc_t t, slong dv, slong len, slong prec);
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_cyc_init(acb_dft_cyc_t t, slong len, slong prec)
|
|
{
|
|
_acb_dft_cyc_init(t, 1, len, prec);
|
|
}
|
|
|
|
void acb_dft_cyc_clear(acb_dft_cyc_t t);
|
|
|
|
void _acb_dft_naive_init(acb_dft_naive_t pol, slong dv, acb_ptr z, slong dz, slong len, slong prec);
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_naive_init(acb_dft_naive_t pol, slong len, slong prec)
|
|
{
|
|
_acb_dft_naive_init(pol, 1, NULL, 0, len, prec);
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_naive_clear(acb_dft_naive_t pol)
|
|
{
|
|
if (pol->zclear)
|
|
_acb_vec_clear(pol->z, pol->n);
|
|
}
|
|
|
|
void _acb_dft_rad2_init(acb_dft_rad2_t t, slong dv, int e, slong prec);
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_rad2_init(acb_dft_rad2_t t, int e, slong prec)
|
|
{
|
|
_acb_dft_rad2_init(t, 1, e, prec);
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_rad2_clear(acb_dft_rad2_t t)
|
|
{
|
|
_acb_vec_clear(t->z, t->nz);
|
|
}
|
|
|
|
void _acb_dft_bluestein_init(acb_dft_bluestein_t t, slong dv, slong n, slong prec);
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_bluestein_init(acb_dft_bluestein_t t, slong n, slong prec)
|
|
{
|
|
_acb_dft_bluestein_init(t, 1, n, prec);
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_dft_bluestein_clear(acb_dft_bluestein_t t)
|
|
{
|
|
if (t->n != 0)
|
|
{
|
|
_acb_vec_clear(t->z, t->n);
|
|
_acb_vec_clear(t->g, t->rad2->n);
|
|
acb_dft_rad2_clear(t->rad2);
|
|
}
|
|
}
|
|
|
|
void _acb_dft_crt_init(acb_dft_crt_t crt, slong dv, slong len, slong prec);
|
|
void acb_dft_crt_init(acb_dft_crt_t crt, slong len, slong prec);
|
|
void acb_dft_crt_clear(acb_dft_crt_t crt);
|
|
|
|
/* utils, could be moved elsewhere */
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_swap_ri(acb_t x)
|
|
{
|
|
arb_swap(acb_realref(x), acb_imagref(x));
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_vec_swap_ri(acb_ptr v, slong len)
|
|
{
|
|
slong k;
|
|
for (k = 0; k < len; k++)
|
|
acb_swap_ri(v + k);
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
_acb_vec_kronecker_mul(acb_ptr z, acb_srcptr x, acb_srcptr y, slong len, slong prec)
|
|
{
|
|
slong k;
|
|
for (k = 0; k < len; k++)
|
|
acb_mul(z + k, x + k, y + k, prec);
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
_acb_vec_kronecker_mul_step(acb_ptr z, acb_srcptr x, acb_srcptr y, slong step, slong len, slong prec)
|
|
{
|
|
slong k;
|
|
for (k = 0; k < len; k++)
|
|
{
|
|
acb_mul(z + k, x + k, y + k * step, prec);
|
|
}
|
|
}
|
|
|
|
ACB_DFT_INLINE void
|
|
acb_vec_printd_index(acb_srcptr vec, slong len, slong digits)
|
|
{
|
|
slong i;
|
|
for (i = 0; i < len; i++)
|
|
{
|
|
flint_printf("[%wd] ", i);
|
|
acb_printd(vec + i, digits);
|
|
flint_printf("\n");
|
|
}
|
|
}
|
|
|
|
#ifdef __cplusplus
|
|
}
|
|
#endif
|
|
|
|
#endif
|