cannam@95: /* cannam@95: * Copyright (c) 2003, 2007-11 Matteo Frigo cannam@95: * Copyright (c) 2003, 2007-11 Massachusetts Institute of Technology cannam@95: * cannam@95: * This program is free software; you can redistribute it and/or modify cannam@95: * it under the terms of the GNU General Public License as published by cannam@95: * the Free Software Foundation; either version 2 of the License, or cannam@95: * (at your option) any later version. cannam@95: * cannam@95: * This program is distributed in the hope that it will be useful, cannam@95: * but WITHOUT ANY WARRANTY; without even the implied warranty of cannam@95: * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the cannam@95: * GNU General Public License for more details. cannam@95: * cannam@95: * You should have received a copy of the GNU General Public License cannam@95: * along with this program; if not, write to the Free Software cannam@95: * Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA cannam@95: * cannam@95: */ cannam@95: cannam@95: cannam@95: /* trigonometric functions */ cannam@95: #include "ifftw.h" cannam@95: #include cannam@95: cannam@95: #if defined(TRIGREAL_IS_LONG_DOUBLE) cannam@95: # define COS cosl cannam@95: # define SIN sinl cannam@95: # define KTRIG(x) (x##L) cannam@95: # ifndef HAVE_DECL_SINL cannam@95: extern long double sinl(long double x); cannam@95: # endif cannam@95: # ifndef HAVE_DECL_COSL cannam@95: extern long double cosl(long double x); cannam@95: # endif cannam@95: #elif defined(TRIGREAL_IS_QUAD) cannam@95: # define COS cosq cannam@95: # define SIN sinq cannam@95: # define KTRIG(x) (x##Q) cannam@95: extern __float128 sinq(__float128 x); cannam@95: extern __float128 cosq(__float128 x); cannam@95: #else cannam@95: # define COS cos cannam@95: # define SIN sin cannam@95: # define KTRIG(x) (x) cannam@95: #endif cannam@95: cannam@95: static const trigreal K2PI = cannam@95: KTRIG(6.2831853071795864769252867665590057683943388); cannam@95: #define by2pi(m, n) ((K2PI * (m)) / (n)) cannam@95: cannam@95: /* cannam@95: * Improve accuracy by reducing x to range [0..1/8] cannam@95: * before multiplication by 2 * PI. cannam@95: */ cannam@95: cannam@95: static void real_cexp(INT m, INT n, trigreal *out) cannam@95: { cannam@95: trigreal theta, c, s, t; cannam@95: unsigned octant = 0; cannam@95: INT quarter_n = n; cannam@95: cannam@95: n += n; n += n; cannam@95: m += m; m += m; cannam@95: cannam@95: if (m < 0) m += n; cannam@95: if (m > n - m) { m = n - m; octant |= 4; } cannam@95: if (m - quarter_n > 0) { m = m - quarter_n; octant |= 2; } cannam@95: if (m > quarter_n - m) { m = quarter_n - m; octant |= 1; } cannam@95: cannam@95: theta = by2pi(m, n); cannam@95: c = COS(theta); s = SIN(theta); cannam@95: cannam@95: if (octant & 1) { t = c; c = s; s = t; } cannam@95: if (octant & 2) { t = c; c = -s; s = t; } cannam@95: if (octant & 4) { s = -s; } cannam@95: cannam@95: out[0] = c; cannam@95: out[1] = s; cannam@95: } cannam@95: cannam@95: static INT choose_twshft(INT n) cannam@95: { cannam@95: INT log2r = 0; cannam@95: while (n > 0) { cannam@95: ++log2r; cannam@95: n /= 4; cannam@95: } cannam@95: return log2r; cannam@95: } cannam@95: cannam@95: static void cexpl_sqrtn_table(triggen *p, INT m, trigreal *res) cannam@95: { cannam@95: m += p->n * (m < 0); cannam@95: cannam@95: { cannam@95: INT m0 = m & p->twmsk; cannam@95: INT m1 = m >> p->twshft; cannam@95: trigreal wr0 = p->W0[2 * m0]; cannam@95: trigreal wi0 = p->W0[2 * m0 + 1]; cannam@95: trigreal wr1 = p->W1[2 * m1]; cannam@95: trigreal wi1 = p->W1[2 * m1 + 1]; cannam@95: cannam@95: res[0] = wr1 * wr0 - wi1 * wi0; cannam@95: res[1] = wi1 * wr0 + wr1 * wi0; cannam@95: } cannam@95: } cannam@95: cannam@95: /* multiply (xr, xi) by exp(FFT_SIGN * 2*pi*i*m/n) */ cannam@95: static void rotate_sqrtn_table(triggen *p, INT m, R xr, R xi, R *res) cannam@95: { cannam@95: m += p->n * (m < 0); cannam@95: cannam@95: { cannam@95: INT m0 = m & p->twmsk; cannam@95: INT m1 = m >> p->twshft; cannam@95: trigreal wr0 = p->W0[2 * m0]; cannam@95: trigreal wi0 = p->W0[2 * m0 + 1]; cannam@95: trigreal wr1 = p->W1[2 * m1]; cannam@95: trigreal wi1 = p->W1[2 * m1 + 1]; cannam@95: trigreal wr = wr1 * wr0 - wi1 * wi0; cannam@95: trigreal wi = wi1 * wr0 + wr1 * wi0; cannam@95: cannam@95: #if FFT_SIGN == -1 cannam@95: res[0] = xr * wr + xi * wi; cannam@95: res[1] = xi * wr - xr * wi; cannam@95: #else cannam@95: res[0] = xr * wr - xi * wi; cannam@95: res[1] = xi * wr + xr * wi; cannam@95: #endif cannam@95: } cannam@95: } cannam@95: cannam@95: static void cexpl_sincos(triggen *p, INT m, trigreal *res) cannam@95: { cannam@95: real_cexp(m, p->n, res); cannam@95: } cannam@95: cannam@95: static void cexp_zero(triggen *p, INT m, R *res) cannam@95: { cannam@95: UNUSED(p); UNUSED(m); cannam@95: res[0] = 0; cannam@95: res[1] = 0; cannam@95: } cannam@95: cannam@95: static void cexpl_zero(triggen *p, INT m, trigreal *res) cannam@95: { cannam@95: UNUSED(p); UNUSED(m); cannam@95: res[0] = 0; cannam@95: res[1] = 0; cannam@95: } cannam@95: cannam@95: static void cexp_generic(triggen *p, INT m, R *res) cannam@95: { cannam@95: trigreal resl[2]; cannam@95: p->cexpl(p, m, resl); cannam@95: res[0] = (R)resl[0]; cannam@95: res[1] = (R)resl[1]; cannam@95: } cannam@95: cannam@95: static void rotate_generic(triggen *p, INT m, R xr, R xi, R *res) cannam@95: { cannam@95: trigreal w[2]; cannam@95: p->cexpl(p, m, w); cannam@95: res[0] = xr * w[0] - xi * (FFT_SIGN * w[1]); cannam@95: res[1] = xi * w[0] + xr * (FFT_SIGN * w[1]); cannam@95: } cannam@95: cannam@95: triggen *X(mktriggen)(enum wakefulness wakefulness, INT n) cannam@95: { cannam@95: INT i, n0, n1; cannam@95: triggen *p = (triggen *)MALLOC(sizeof(*p), TWIDDLES); cannam@95: cannam@95: p->n = n; cannam@95: p->W0 = p->W1 = 0; cannam@95: p->cexp = 0; cannam@95: p->rotate = 0; cannam@95: cannam@95: switch (wakefulness) { cannam@95: case SLEEPY: cannam@95: A(0 /* can't happen */); cannam@95: break; cannam@95: cannam@95: case AWAKE_SQRTN_TABLE: { cannam@95: INT twshft = choose_twshft(n); cannam@95: cannam@95: p->twshft = twshft; cannam@95: p->twradix = ((INT)1) << twshft; cannam@95: p->twmsk = p->twradix - 1; cannam@95: cannam@95: n0 = p->twradix; cannam@95: n1 = (n + n0 - 1) / n0; cannam@95: cannam@95: p->W0 = (trigreal *)MALLOC(n0 * 2 * sizeof(trigreal), TWIDDLES); cannam@95: p->W1 = (trigreal *)MALLOC(n1 * 2 * sizeof(trigreal), TWIDDLES); cannam@95: cannam@95: for (i = 0; i < n0; ++i) cannam@95: real_cexp(i, n, p->W0 + 2 * i); cannam@95: cannam@95: for (i = 0; i < n1; ++i) cannam@95: real_cexp(i * p->twradix, n, p->W1 + 2 * i); cannam@95: cannam@95: p->cexpl = cexpl_sqrtn_table; cannam@95: p->rotate = rotate_sqrtn_table; cannam@95: break; cannam@95: } cannam@95: cannam@95: case AWAKE_SINCOS: cannam@95: p->cexpl = cexpl_sincos; cannam@95: break; cannam@95: cannam@95: case AWAKE_ZERO: cannam@95: p->cexp = cexp_zero; cannam@95: p->cexpl = cexpl_zero; cannam@95: break; cannam@95: } cannam@95: cannam@95: if (!p->cexp) { cannam@95: if (sizeof(trigreal) == sizeof(R)) cannam@95: p->cexp = (void (*)(triggen *, INT, R *))p->cexpl; cannam@95: else cannam@95: p->cexp = cexp_generic; cannam@95: } cannam@95: if (!p->rotate) cannam@95: p->rotate = rotate_generic; cannam@95: return p; cannam@95: } cannam@95: cannam@95: void X(triggen_destroy)(triggen *p) cannam@95: { cannam@95: X(ifree0)(p->W0); cannam@95: X(ifree0)(p->W1); cannam@95: X(ifree)(p); cannam@95: }