source: src/spectral/mfcc.c @ c879811

feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5
Last change on this file since c879811 was c879811, checked in by Paul Brossier <piem@piem.org>, 5 years ago

[mfcc] add slaney mode takes no params

  • Property mode set to 100644
File size: 4.6 KB
RevLine 
[88199ce]1/*
[7a84b21]2  Copyright (C) 2007-2009 Paul Brossier <piem@aubio.org>
3                      and Amaury Hazan <ahazan@iua.upf.edu>
[88199ce]4
[1c2e186]5  This file is part of aubio.
[88199ce]6
[1c2e186]7  aubio is free software: you can redistribute it and/or modify
[7a84b21]8  it under the terms of the GNU General Public License as published by
9  the Free Software Foundation, either version 3 of the License, or
10  (at your option) any later version.
[88199ce]11
[1c2e186]12  aubio is distributed in the hope that it will be useful,
[7a84b21]13  but WITHOUT ANY WARRANTY; without even the implied warranty of
14  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  GNU General Public License for more details.
16
17  You should have received a copy of the GNU General Public License
[1c2e186]18  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
[88199ce]19
20*/
21
[7c6c806d]22#include "aubio_priv.h"
[6c7d49b]23#include "fvec.h"
[d95ff38]24#include "fmat.h"
[6c7d49b]25#include "cvec.h"
[d37400c]26#include "mathutils.h"
[d0dca26]27#include "vecutils.h"
[32d6958]28#include "spectral/fft.h"
[d90db7d4]29#include "spectral/filterbank.h"
[06cae6c]30#include "spectral/filterbank_mel.h"
[d8b1161]31#include "spectral/dct.h"
[32d6958]32#include "spectral/mfcc.h"
[88199ce]33
/* When HAVE_NOOPT is defined, select the matrix-based DCT code paths
 * guarded by HAVE_SLOW_DCT in the rest of this file. */
#if defined(HAVE_NOOPT)
#define HAVE_SLOW_DCT 1
#endif /* HAVE_NOOPT */
[d8b1161]37
[7a84b21]38/** Internal structure for mfcc object */
[88199ce]39
[d99d819]40struct _aubio_mfcc_t
[7a84b21]41{
[34d72f0]42  uint_t win_s;             /** grain length */
43  uint_t samplerate;        /** sample rate (needed?) */
[f2a0769]44  uint_t n_filters;         /** number of filters */
[7a46bf6]45  uint_t n_coefs;           /** number of coefficients (<= n_filters/2 +1) */
[7a84b21]46  aubio_filterbank_t *fb;   /** filter bank */
47  fvec_t *in_dct;           /** input buffer for dct * [fb->n_filters] */
[d8b1161]48#if defined(HAVE_SLOW_DCT)
[d95ff38]49  fmat_t *dct_coeffs;       /** DCT transform n_filters * n_coeffs */
[d8b1161]50#else
51  aubio_dct_t *dct;
52  fvec_t *output;
53#endif
[d66d2ac]54  smpl_t scale;
[8708556]55};
56
57
[7a84b21]58aubio_mfcc_t *
[41bf913]59new_aubio_mfcc (uint_t win_s, uint_t n_filters, uint_t n_coefs,
60    uint_t samplerate)
[7a84b21]61{
62
63  /* allocate space for mfcc object */
64  aubio_mfcc_t *mfcc = AUBIO_NEW (aubio_mfcc_t);
[d8b1161]65#if defined(HAVE_SLOW_DCT)
[78c21cf]66  smpl_t scaling;
[c185ebb]67
68  uint_t i, j;
[d8b1161]69#endif
[c185ebb]70
[7a84b21]71  mfcc->win_s = win_s;
72  mfcc->samplerate = samplerate;
73  mfcc->n_filters = n_filters;
74  mfcc->n_coefs = n_coefs;
[cfe4038]75
[7a84b21]76  /* filterbank allocation */
77  mfcc->fb = new_aubio_filterbank (n_filters, mfcc->win_s);
78  aubio_filterbank_set_mel_coeffs_slaney (mfcc->fb, samplerate);
[8708556]79
[7a84b21]80  /* allocating buffers */
[d95ff38]81  mfcc->in_dct = new_fvec (n_filters);
[8708556]82
[d8b1161]83#if defined(HAVE_SLOW_DCT)
[c02a1cc]84  mfcc->dct_coeffs = new_fmat (n_coefs, n_filters);
[c185ebb]85
[c02a1cc]86  /* compute DCT transform dct_coeffs[j][i] as
[7a84b21]87     cos ( j * (i+.5) * PI / n_filters ) */
[78c21cf]88  scaling = 1. / SQRT (n_filters / 2.);
[7a84b21]89  for (i = 0; i < n_filters; i++) {
[c185ebb]90    for (j = 0; j < n_coefs; j++) {
[c02a1cc]91      mfcc->dct_coeffs->data[j][i] =
[7a84b21]92          scaling * COS (j * (i + 0.5) * PI / n_filters);
[c185ebb]93    }
[c02a1cc]94    mfcc->dct_coeffs->data[0][i] *= SQRT (2.) / 2.;
[c185ebb]95  }
[d8b1161]96#else
97  mfcc->dct = new_aubio_dct (n_filters);
98  mfcc->output = new_fvec (n_filters);
99#endif
[8708556]100
[d66d2ac]101  mfcc->scale = 1.;
102
[8708556]103  return mfcc;
[163d159]104}
[8708556]105
[7a84b21]106void
107del_aubio_mfcc (aubio_mfcc_t * mf)
108{
109
110  /* delete filterbank */
111  del_aubio_filterbank (mf->fb);
112
113  /* delete buffers */
114  del_fvec (mf->in_dct);
[d8b1161]115#if defined(HAVE_SLOW_DCT)
[fc759f3]116  del_fmat (mf->dct_coeffs);
[d8b1161]117#else
118  del_aubio_dct (mf->dct);
119  del_fvec (mf->output);
120#endif
[7a84b21]121
122  /* delete mfcc object */
123  AUBIO_FREE (mf);
[88199ce]124}
125
[177f09a]126
[7a84b21]127void
[feb694b]128aubio_mfcc_do (aubio_mfcc_t * mf, const cvec_t * in, fvec_t * out)
[7a84b21]129{
[3aa60b2]130#ifndef HAVE_SLOW_DCT
131  fvec_t tmp;
132#endif
[d66d2ac]133
[7a84b21]134  /* compute filterbank */
135  aubio_filterbank_do (mf->fb, in, mf->in_dct);
[c185ebb]136
[d37400c]137  /* compute log10 */
138  fvec_log10 (mf->in_dct);
139
[d66d2ac]140  if (mf->scale != 1) fvec_mul (mf->in_dct, mf->scale);
[d37400c]141
[73e8f65]142  /* compute mfccs */
[d8b1161]143#if defined(HAVE_SLOW_DCT)
[73e8f65]144  fmat_vecmul(mf->dct_coeffs, mf->in_dct, out);
[d8b1161]145#else
146  aubio_dct_do(mf->dct, mf->in_dct, mf->output);
147  // copy only first n_coeffs elements
148  // TODO assert mf->output->length == n_coeffs
149  tmp.data = mf->output->data;
150  tmp.length = out->length;
151  fvec_copy(&tmp, out);
152#endif
[cfe4038]153
[c185ebb]154  return;
155}
[517630f]156
157uint_t aubio_mfcc_set_power (aubio_mfcc_t *mf, smpl_t power)
158{
159  return aubio_filterbank_set_power(mf->fb, power);
160}
161
162uint_t aubio_mfcc_get_power (aubio_mfcc_t *mf)
163{
164  return aubio_filterbank_get_power(mf->fb);
165}
166
[d66d2ac]167uint_t aubio_mfcc_set_scale (aubio_mfcc_t *mf, smpl_t scale)
168{
169  mf->scale = scale;
170  return AUBIO_OK;
171}
172
173uint_t aubio_mfcc_get_scale (aubio_mfcc_t *mf)
174{
175  return mf->scale;
176}
177
[517630f]178uint_t aubio_mfcc_set_mel_coeffs (aubio_mfcc_t *mf, smpl_t freq_min,
179    smpl_t freq_max)
180{
181  return aubio_filterbank_set_mel_coeffs(mf->fb, mf->samplerate,
182      freq_min, freq_max);
183}
184
185uint_t aubio_mfcc_set_mel_coeffs_htk (aubio_mfcc_t *mf, smpl_t freq_min,
186    smpl_t freq_max)
187{
188  return aubio_filterbank_set_mel_coeffs_htk(mf->fb, mf->samplerate,
189      freq_min, freq_max);
190}
[10fafc2]191
[c879811]192uint_t aubio_mfcc_set_mel_coeffs_slaney (aubio_mfcc_t *mf)
[10fafc2]193{
194  return aubio_filterbank_set_mel_coeffs_slaney (mf->fb, mf->samplerate);
195}
Note: See TracBrowser for help on using the repository browser.