source: src/spectral/fft.c @ 69c39ca

Branches: feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since 69c39ca was 69c39ca, checked in by Paul Brossier <piem@piem.org>, 11 years ago

src/spectral/fft.c: add vDSP for HAVE_AUBIO_DOUBLE

  • Property mode set to 100644
File size: 12.4 KB
RevLine 
[96fb8ad]1/*
[e6a78ea]2  Copyright (C) 2003-2009 Paul Brossier <piem@aubio.org>
[96fb8ad]3
[e6a78ea]4  This file is part of aubio.
[96fb8ad]5
[e6a78ea]6  aubio is free software: you can redistribute it and/or modify
7  it under the terms of the GNU General Public License as published by
8  the Free Software Foundation, either version 3 of the License, or
9  (at your option) any later version.
[96fb8ad]10
[e6a78ea]11  aubio is distributed in the hope that it will be useful,
12  but WITHOUT ANY WARRANTY; without even the implied warranty of
13  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  GNU General Public License for more details.
15
16  You should have received a copy of the GNU General Public License
17  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
[96fb8ad]18
19*/
20
21#include "aubio_priv.h"
[aadd27a]22#include "fvec.h"
23#include "cvec.h"
[96fb8ad]24#include "mathutils.h"
[32d6958]25#include "spectral/fft.h"
[96fb8ad]26
/* Backend selection: FFTW3 when HAVE_FFTW3 is defined, otherwise Apple's
 * Accelerate framework when HAVE_ACCELERATE is defined, otherwise Ooura. */
#if defined(HAVE_FFTW3)         // using FFTW3
/* note that <complex.h> is not included here but only in aubio_priv.h, so that
 * c++ projects can still use their own complex definition. */
#include <fftw3.h>
#include <pthread.h>

#ifdef HAVE_FFTW3F              // single precision flavour of FFTW3

#ifdef HAVE_COMPLEX_H
/** fft data type with complex.h and fftw3f */
#define FFTW_TYPE fftwf_complex
#else
/** fft data type without complex.h and with fftw3f */
#define FFTW_TYPE float
#endif /* HAVE_COMPLEX_H */

/* route the double precision entry points used in this file to fftw3f */
#define fftw_malloc            fftwf_malloc
#define fftw_free              fftwf_free
#define fftw_execute           fftwf_execute
#define fftw_plan_dft_r2c_1d   fftwf_plan_dft_r2c_1d
#define fftw_plan_dft_c2r_1d   fftwf_plan_dft_c2r_1d
#define fftw_plan_r2r_1d       fftwf_plan_r2r_1d
#define fftw_plan              fftwf_plan
#define fftw_destroy_plan      fftwf_destroy_plan

#if HAVE_AUBIO_DOUBLE
#warning "Using aubio in double precision with fftw3 in single precision"
#endif /* HAVE_AUBIO_DOUBLE */
/* sample type of the real-valued buffers handed to FFTW */
#define real_t float

#else /* HAVE_FFTW3F */         // double precision flavour of FFTW3

#ifdef HAVE_COMPLEX_H
/** fft data type with complex.h and fftw3 */
#define FFTW_TYPE fftw_complex
#else
/** fft data type without complex.h and with fftw */
#define FFTW_TYPE double
#endif /* HAVE_COMPLEX_H */

#if !HAVE_AUBIO_DOUBLE
#warning "Using aubio in single precision with fftw3 in double precision"
#endif /* HAVE_AUBIO_DOUBLE */
/* sample type of the real-valued buffers handed to FFTW */
#define real_t double

#endif /* HAVE_FFTW3F */

/** fft data type */
typedef FFTW_TYPE fft_data_t;

// a global mutex for FFTW thread safety, held while plans are created
pthread_mutex_t aubio_fftw_mutex = PTHREAD_MUTEX_INITIALIZER;

#elif defined(HAVE_ACCELERATE)  // using ACCELERATE
// https://developer.apple.com/library/mac/#documentation/Accelerate/Reference/vDSPRef/Reference/reference.html
#include <Accelerate/Accelerate.h>

#else                           // using OOURA
// let's use ooura instead; rdft is provided by another translation unit
extern void rdft(int, int, double *, int *, double *);

#endif /* HAVE_FFTW3 / HAVE_ACCELERATE / OOURA */
91
[96fb8ad]92struct _aubio_fft_t {
[aadd27a]93  uint_t winsize;
94  uint_t fft_size;
[54dd945]95#ifdef HAVE_FFTW3             // using FFTW3
[aadd27a]96  real_t *in, *out;
[4b6937b]97  fftw_plan pfw, pbw;
[aadd27a]98  fft_data_t * specdata;     /* complex spectral data */
[729a3c0]99#else
[54dd945]100#ifdef HAVE_ACCELERATE        // using ACCELERATE
101  int log2fftsize;
[69c39ca]102#if !HAVE_AUBIO_DOUBLE
[54dd945]103  FFTSetup fftSetup;
104  DSPSplitComplex spec;
105  float *in, *out;
[69c39ca]106#else
107  FFTSetupD fftSetup;
108  DSPDoubleSplitComplex spec;
109  double *in, *out;
110#endif
[54dd945]111#else                         // using OOURA
[729a3c0]112  double *in, *out;
113  double *w;
114  int *ip;
[54dd945]115#endif /* HAVE_ACCELERATE */
[729a3c0]116#endif /* HAVE_FFTW3 */
[aadd27a]117  fvec_t * compspec;
[96fb8ad]118};
119
[729a3c0]120aubio_fft_t * new_aubio_fft (uint_t winsize) {
[a47cd35]121  aubio_fft_t * s = AUBIO_NEW(aubio_fft_t);
[729a3c0]122#ifdef HAVE_FFTW3
[8b3a7e7]123  uint_t i;
[aadd27a]124  s->winsize  = winsize;
[a47cd35]125  /* allocate memory */
[aadd27a]126  s->in       = AUBIO_ARRAY(real_t,winsize);
127  s->out      = AUBIO_ARRAY(real_t,winsize);
[d95ff38]128  s->compspec = new_fvec(winsize);
[a47cd35]129  /* create plans */
[d453a4a]130  pthread_mutex_lock(&aubio_fftw_mutex);
[237f632]131#ifdef HAVE_COMPLEX_H
[4b6937b]132  s->fft_size = winsize/2 + 1;
[a47cd35]133  s->specdata = (fft_data_t*)fftw_malloc(sizeof(fft_data_t)*s->fft_size);
[aadd27a]134  s->pfw = fftw_plan_dft_r2c_1d(winsize, s->in,  s->specdata, FFTW_ESTIMATE);
135  s->pbw = fftw_plan_dft_c2r_1d(winsize, s->specdata, s->out, FFTW_ESTIMATE);
[237f632]136#else
[aadd27a]137  s->fft_size = winsize;
[a47cd35]138  s->specdata = (fft_data_t*)fftw_malloc(sizeof(fft_data_t)*s->fft_size);
[aadd27a]139  s->pfw = fftw_plan_r2r_1d(winsize, s->in,  s->specdata, FFTW_R2HC, FFTW_ESTIMATE);
140  s->pbw = fftw_plan_r2r_1d(winsize, s->specdata, s->out, FFTW_HC2R, FFTW_ESTIMATE);
[237f632]141#endif
[d453a4a]142  pthread_mutex_unlock(&aubio_fftw_mutex);
[4f4299d]143  for (i = 0; i < s->winsize; i++) {
144    s->in[i] = 0.;
145    s->out[i] = 0.;
146  }
147  for (i = 0; i < s->fft_size; i++) {
148    s->specdata[i] = 0.;
149  }
[729a3c0]150#else
[54dd945]151#ifdef HAVE_ACCELERATE        // using ACCELERATE
152  s->winsize = winsize;
153  s->fft_size = winsize;
154  s->compspec = new_fvec(winsize);
155  s->log2fftsize = (uint_t)log2f(s->fft_size);
[69c39ca]156#if !HAVE_AUBIO_DOUBLE
[54dd945]157  s->in = AUBIO_ARRAY(float, s->fft_size);
158  s->out = AUBIO_ARRAY(float, s->fft_size);
159  s->spec.realp = AUBIO_ARRAY(float, s->fft_size/2);
160  s->spec.imagp = AUBIO_ARRAY(float, s->fft_size/2);
161  s->fftSetup = vDSP_create_fftsetup(s->log2fftsize, FFT_RADIX2);
[69c39ca]162#else
163  s->in = AUBIO_ARRAY(double, s->fft_size);
164  s->out = AUBIO_ARRAY(double, s->fft_size);
165  s->spec.realp = AUBIO_ARRAY(double, s->fft_size/2);
166  s->spec.imagp = AUBIO_ARRAY(double, s->fft_size/2);
167  s->fftSetup = vDSP_create_fftsetupD(s->log2fftsize, FFT_RADIX2);
168#endif
[54dd945]169#else                         // using OOURA
[729a3c0]170  s->winsize = winsize;
171  s->fft_size = winsize / 2 + 1;
172  s->compspec = new_fvec(winsize);
[f61c88a]173  s->in    = AUBIO_ARRAY(double, s->winsize);
174  s->out   = AUBIO_ARRAY(double, s->winsize);
[729a3c0]175  s->ip    = AUBIO_ARRAY(int   , s->fft_size);
176  s->w     = AUBIO_ARRAY(double, s->fft_size);
177  s->ip[0] = 0;
[54dd945]178#endif /* HAVE_ACCELERATE */
179#endif /* HAVE_FFTW3 */
[a47cd35]180  return s;
[96fb8ad]181}
182
183void del_aubio_fft(aubio_fft_t * s) {
[a47cd35]184  /* destroy data */
[aadd27a]185  del_fvec(s->compspec);
[54dd945]186#ifdef HAVE_FFTW3             // using FFTW3
[a47cd35]187  fftw_destroy_plan(s->pfw);
188  fftw_destroy_plan(s->pbw);
189  fftw_free(s->specdata);
[729a3c0]190#else /* HAVE_FFTW3 */
[54dd945]191#ifdef HAVE_ACCELERATE        // using ACCELERATE
192  AUBIO_FREE(s->spec.realp);
193  AUBIO_FREE(s->spec.imagp);
194#else                         // using OOURA
[729a3c0]195  AUBIO_FREE(s->w);
196  AUBIO_FREE(s->ip);
[54dd945]197#endif /* HAVE_ACCELERATE */
[729a3c0]198#endif /* HAVE_FFTW3 */
[a47cd35]199  AUBIO_FREE(s->out);
[729a3c0]200  AUBIO_FREE(s->in);
[a47cd35]201  AUBIO_FREE(s);
[96fb8ad]202}
203
[aadd27a]204void aubio_fft_do(aubio_fft_t * s, fvec_t * input, cvec_t * spectrum) {
205  aubio_fft_do_complex(s, input, s->compspec);
206  aubio_fft_get_spectrum(s->compspec, spectrum);
[96fb8ad]207}
208
[aadd27a]209void aubio_fft_rdo(aubio_fft_t * s, cvec_t * spectrum, fvec_t * output) {
210  aubio_fft_get_realimag(spectrum, s->compspec);
211  aubio_fft_rdo_complex(s, s->compspec, output);
[96fb8ad]212}
213
[aadd27a]214void aubio_fft_do_complex(aubio_fft_t * s, fvec_t * input, fvec_t * compspec) {
[729a3c0]215  uint_t i;
216  for (i=0; i < s->winsize; i++) {
217    s->in[i] = input->data[i];
[d95ff38]218  }
[54dd945]219#ifdef HAVE_FFTW3             // using FFTW3
[d95ff38]220  fftw_execute(s->pfw);
[4b6937b]221#ifdef HAVE_COMPLEX_H
[d95ff38]222  compspec->data[0] = REAL(s->specdata[0]);
[729a3c0]223  for (i = 1; i < s->fft_size -1 ; i++) {
224    compspec->data[i] = REAL(s->specdata[i]);
225    compspec->data[compspec->length - i] = IMAG(s->specdata[i]);
[d95ff38]226  }
227  compspec->data[s->fft_size-1] = REAL(s->specdata[s->fft_size-1]);
[729a3c0]228#else /* HAVE_COMPLEX_H  */
229  for (i = 0; i < s->fft_size; i++) {
230    compspec->data[i] = s->specdata[i];
[237f632]231  }
[729a3c0]232#endif /* HAVE_COMPLEX_H */
233#else /* HAVE_FFTW3 */
[54dd945]234#ifdef HAVE_ACCELERATE        // using ACCELERATE
[69c39ca]235#if !HAVE_AUBIO_DOUBLE
[54dd945]236  // convert real data to even/odd format used in vDSP
[69c39ca]237  vDSP_ctoz((DSPComplex*)s->in, 2, &s->spec, 1, s->fft_size/2);
[54dd945]238  // compute the FFT
239  vDSP_fft_zrip(s->fftSetup, &s->spec, 1, s->log2fftsize, FFT_FORWARD);
[69c39ca]240#else
241  // convert real data to even/odd format used in vDSP
242  vDSP_ctozD((DSPDoubleComplex*)s->in, 2, &s->spec, 1, s->fft_size/2);
243  // compute the FFT
244  vDSP_fft_zripD(s->fftSetup, &s->spec, 1, s->log2fftsize, FFT_FORWARD);
245#endif
[54dd945]246  // convert from vDSP complex split to [ r0, r1, ..., rN, iN-1, .., i2, i1]
247  compspec->data[0] = s->spec.realp[0];
248  compspec->data[s->fft_size / 2] = s->spec.imagp[0];
249  for (i = 1; i < s->fft_size / 2; i++) {
250    compspec->data[i] = s->spec.realp[i];
251    compspec->data[s->fft_size - i] = s->spec.imagp[i];
252  }
253  // apply scaling
254  smpl_t scale = 1./2.;
[69c39ca]255#if !HAVE_AUBIO_DOUBLE
[54dd945]256  vDSP_vsmul(compspec->data, 1, &scale, compspec->data, 1, s->fft_size);
[69c39ca]257#else
258  vDSP_vsmulD(compspec->data, 1, &scale, compspec->data, 1, s->fft_size);
259#endif
[54dd945]260#else                         // using OOURA
[729a3c0]261  rdft(s->winsize, 1, s->in, s->ip, s->w);
262  compspec->data[0] = s->in[0];
263  compspec->data[s->winsize / 2] = s->in[1];
264  for (i = 1; i < s->fft_size - 1; i++) {
265    compspec->data[i] = s->in[2 * i];
266    compspec->data[s->winsize - i] = - s->in[2 * i + 1];
267  }
[54dd945]268#endif /* HAVE_ACCELERATE */
[729a3c0]269#endif /* HAVE_FFTW3 */
[96fb8ad]270}
271
[aadd27a]272void aubio_fft_rdo_complex(aubio_fft_t * s, fvec_t * compspec, fvec_t * output) {
[729a3c0]273  uint_t i;
274#ifdef HAVE_FFTW3
[aadd27a]275  const smpl_t renorm = 1./(smpl_t)s->winsize;
[4b6937b]276#ifdef HAVE_COMPLEX_H
[d95ff38]277  s->specdata[0] = compspec->data[0];
[729a3c0]278  for (i=1; i < s->fft_size - 1; i++) {
279    s->specdata[i] = compspec->data[i] +
280      I * compspec->data[compspec->length - i];
[d95ff38]281  }
282  s->specdata[s->fft_size - 1] = compspec->data[s->fft_size - 1];
[237f632]283#else
[729a3c0]284  for (i=0; i < s->fft_size; i++) {
285    s->specdata[i] = compspec->data[i];
[d95ff38]286  }
[aadd27a]287#endif
[d95ff38]288  fftw_execute(s->pbw);
[729a3c0]289  for (i = 0; i < output->length; i++) {
290    output->data[i] = s->out[i]*renorm;
291  }
292#else /* HAVE_FFTW3 */
[54dd945]293#ifdef HAVE_ACCELERATE        // using ACCELERATE
294  // convert from real imag  [ r0, r1, ..., rN, iN-1, .., i2, i1]
295  // to vDSP packed format   [ r0, rN, r1, i1, ..., rN-1, iN-1 ]
296  s->out[0] = compspec->data[0];
297  s->out[1] = compspec->data[s->winsize / 2];
298  for (i = 1; i < s->fft_size / 2; i++) {
299    s->out[2 * i] = compspec->data[i];
300    s->out[2 * i + 1] = compspec->data[s->winsize - i];
301  }
[69c39ca]302#if !HAVE_AUBIO_DOUBLE
[54dd945]303  // convert to split complex format used in vDSP
[69c39ca]304  vDSP_ctoz((DSPComplex*)s->out, 2, &s->spec, 1, s->fft_size/2);
[54dd945]305  // compute the FFT
306  vDSP_fft_zrip(s->fftSetup, &s->spec, 1, s->log2fftsize, FFT_INVERSE);
307  // convert result to real output
[69c39ca]308  vDSP_ztoc(&s->spec, 1, (DSPComplex*)output->data, 2, s->fft_size/2);
[54dd945]309  // apply scaling
310  smpl_t scale = 1.0 / s->winsize;
311  vDSP_vsmul(output->data, 1, &scale, output->data, 1, s->fft_size);
[69c39ca]312#else
313  // convert to split complex format used in vDSP
314  vDSP_ctozD((DSPDoubleComplex*)s->out, 2, &s->spec, 1, s->fft_size/2);
315  // compute the FFT
316  vDSP_fft_zripD(s->fftSetup, &s->spec, 1, s->log2fftsize, FFT_INVERSE);
317  // convert result to real output
318  vDSP_ztocD(&s->spec, 1, (DSPDoubleComplex*)output->data, 2, s->fft_size/2);
319  // apply scaling
320  smpl_t scale = 1.0 / s->winsize;
321  vDSP_vsmulD(output->data, 1, &scale, output->data, 1, s->fft_size);
322#endif
[54dd945]323#else                         // using OOURA
[729a3c0]324  smpl_t scale = 2.0 / s->winsize;
325  s->out[0] = compspec->data[0];
326  s->out[1] = compspec->data[s->winsize / 2];
327  for (i = 1; i < s->fft_size - 1; i++) {
328    s->out[2 * i] = compspec->data[i];
329    s->out[2 * i + 1] = - compspec->data[s->winsize - i];
[aadd27a]330  }
[729a3c0]331  rdft(s->winsize, -1, s->out, s->ip, s->w);
332  for (i=0; i < s->winsize; i++) {
333    output->data[i] = s->out[i] * scale;
334  }
[54dd945]335#endif /* HAVE_ACCELERATE */
[729a3c0]336#endif /* HAVE_FFTW3 */
[237f632]337}
338
[aadd27a]339void aubio_fft_get_spectrum(fvec_t * compspec, cvec_t * spectrum) {
340  aubio_fft_get_phas(compspec, spectrum);
341  aubio_fft_get_norm(compspec, spectrum);
[237f632]342}
343
[aadd27a]344void aubio_fft_get_realimag(cvec_t * spectrum, fvec_t * compspec) {
345  aubio_fft_get_imag(spectrum, compspec);
346  aubio_fft_get_real(spectrum, compspec);
[237f632]347}
348
[aadd27a]349void aubio_fft_get_phas(fvec_t * compspec, cvec_t * spectrum) {
[729a3c0]350  uint_t i;
[d95ff38]351  if (compspec->data[0] < 0) {
352    spectrum->phas[0] = PI;
353  } else {
354    spectrum->phas[0] = 0.;
355  }
[729a3c0]356  for (i=1; i < spectrum->length - 1; i++) {
357    spectrum->phas[i] = ATAN2(compspec->data[compspec->length-i],
358        compspec->data[i]);
[d95ff38]359  }
360  if (compspec->data[compspec->length/2] < 0) {
361    spectrum->phas[spectrum->length - 1] = PI;
362  } else {
363    spectrum->phas[spectrum->length - 1] = 0.;
[aadd27a]364  }
[f88a326]365}
366
[aadd27a]367void aubio_fft_get_norm(fvec_t * compspec, cvec_t * spectrum) {
[729a3c0]368  uint_t i = 0;
[d95ff38]369  spectrum->norm[0] = ABS(compspec->data[0]);
[729a3c0]370  for (i=1; i < spectrum->length - 1; i++) {
371    spectrum->norm[i] = SQRT(SQR(compspec->data[i])
372        + SQR(compspec->data[compspec->length - i]) );
[a47cd35]373  }
[729a3c0]374  spectrum->norm[spectrum->length-1] =
[d95ff38]375    ABS(compspec->data[compspec->length/2]);
[f88a326]376}
377
[aadd27a]378void aubio_fft_get_imag(cvec_t * spectrum, fvec_t * compspec) {
[729a3c0]379  uint_t i;
380  for (i = 1; i < ( compspec->length + 1 ) / 2 /*- 1 + 1*/; i++) {
381    compspec->data[compspec->length - i] =
382      spectrum->norm[i]*SIN(spectrum->phas[i]);
[a47cd35]383  }
[f88a326]384}
385
[aadd27a]386void aubio_fft_get_real(cvec_t * spectrum, fvec_t * compspec) {
[729a3c0]387  uint_t i;
388  for (i = 0; i < compspec->length / 2 + 1; i++) {
389    compspec->data[i] = 
390      spectrum->norm[i]*COS(spectrum->phas[i]);
[aadd27a]391  }
[f88a326]392}
Note: See TracBrowser for help on using the repository browser.