source: src/spectral/mfcc.c @ 21067f9

feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5
Last change on this file since 21067f9 was d66d2ac, checked in by Paul Brossier <piem@piem.org>, 6 years ago

[mfcc] remove note about power, add scale

  • Property mode set to 100644
File size: 4.7 KB
Line 
1/*
2  Copyright (C) 2007-2009 Paul Brossier <piem@aubio.org>
3                      and Amaury Hazan <ahazan@iua.upf.edu>
4
5  This file is part of aubio.
6
7  aubio is free software: you can redistribute it and/or modify
8  it under the terms of the GNU General Public License as published by
9  the Free Software Foundation, either version 3 of the License, or
10  (at your option) any later version.
11
12  aubio is distributed in the hope that it will be useful,
13  but WITHOUT ANY WARRANTY; without even the implied warranty of
14  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
15  GNU General Public License for more details.
16
17  You should have received a copy of the GNU General Public License
18  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
19
20*/
21
22#include "aubio_priv.h"
23#include "fvec.h"
24#include "fmat.h"
25#include "cvec.h"
26#include "mathutils.h"
27#include "vecutils.h"
28#include "spectral/fft.h"
29#include "spectral/filterbank.h"
30#include "spectral/filterbank_mel.h"
31#include "spectral/dct.h"
32#include "spectral/mfcc.h"
33
/* When HAVE_NOOPT is defined, select the matrix-based DCT code path
   (the HAVE_SLOW_DCT branches below) instead of the aubio_dct_t one. */
#if defined(HAVE_NOOPT)
#define HAVE_SLOW_DCT 1
#endif /* HAVE_NOOPT */
37
38/** Internal structure for mfcc object */
39
40struct _aubio_mfcc_t
41{
42  uint_t win_s;             /** grain length */
43  uint_t samplerate;        /** sample rate (needed?) */
44  uint_t n_filters;         /** number of filters */
45  uint_t n_coefs;           /** number of coefficients (<= n_filters/2 +1) */
46  aubio_filterbank_t *fb;   /** filter bank */
47  fvec_t *in_dct;           /** input buffer for dct * [fb->n_filters] */
48#if defined(HAVE_SLOW_DCT)
49  fmat_t *dct_coeffs;       /** DCT transform n_filters * n_coeffs */
50#else
51  aubio_dct_t *dct;
52  fvec_t *output;
53#endif
54  smpl_t scale;
55};
56
57
58aubio_mfcc_t *
59new_aubio_mfcc (uint_t win_s, uint_t n_filters, uint_t n_coefs,
60    uint_t samplerate)
61{
62
63  /* allocate space for mfcc object */
64  aubio_mfcc_t *mfcc = AUBIO_NEW (aubio_mfcc_t);
65#if defined(HAVE_SLOW_DCT)
66  smpl_t scaling;
67
68  uint_t i, j;
69#endif
70
71  mfcc->win_s = win_s;
72  mfcc->samplerate = samplerate;
73  mfcc->n_filters = n_filters;
74  mfcc->n_coefs = n_coefs;
75
76  /* filterbank allocation */
77  mfcc->fb = new_aubio_filterbank (n_filters, mfcc->win_s);
78  aubio_filterbank_set_mel_coeffs_slaney (mfcc->fb, samplerate);
79
80  /* allocating buffers */
81  mfcc->in_dct = new_fvec (n_filters);
82
83#if defined(HAVE_SLOW_DCT)
84  mfcc->dct_coeffs = new_fmat (n_coefs, n_filters);
85
86  /* compute DCT transform dct_coeffs[j][i] as
87     cos ( j * (i+.5) * PI / n_filters ) */
88  scaling = 1. / SQRT (n_filters / 2.);
89  for (i = 0; i < n_filters; i++) {
90    for (j = 0; j < n_coefs; j++) {
91      mfcc->dct_coeffs->data[j][i] =
92          scaling * COS (j * (i + 0.5) * PI / n_filters);
93    }
94    mfcc->dct_coeffs->data[0][i] *= SQRT (2.) / 2.;
95  }
96#else
97  mfcc->dct = new_aubio_dct (n_filters);
98  mfcc->output = new_fvec (n_filters);
99#endif
100
101  mfcc->scale = 1.;
102
103  return mfcc;
104}
105
106void
107del_aubio_mfcc (aubio_mfcc_t * mf)
108{
109
110  /* delete filterbank */
111  del_aubio_filterbank (mf->fb);
112
113  /* delete buffers */
114  del_fvec (mf->in_dct);
115#if defined(HAVE_SLOW_DCT)
116  del_fmat (mf->dct_coeffs);
117#else
118  del_aubio_dct (mf->dct);
119  del_fvec (mf->output);
120#endif
121
122  /* delete mfcc object */
123  AUBIO_FREE (mf);
124}
125
126
127void
128aubio_mfcc_do (aubio_mfcc_t * mf, const cvec_t * in, fvec_t * out)
129{
130#ifndef HAVE_SLOW_DCT
131  fvec_t tmp;
132#endif
133
134  /* compute filterbank */
135  aubio_filterbank_do (mf->fb, in, mf->in_dct);
136
137  /* compute log10 */
138  fvec_log10 (mf->in_dct);
139
140  if (mf->scale != 1) fvec_mul (mf->in_dct, mf->scale);
141
142  /* compute mfccs */
143#if defined(HAVE_SLOW_DCT)
144  fmat_vecmul(mf->dct_coeffs, mf->in_dct, out);
145#else
146  aubio_dct_do(mf->dct, mf->in_dct, mf->output);
147  // copy only first n_coeffs elements
148  // TODO assert mf->output->length == n_coeffs
149  tmp.data = mf->output->data;
150  tmp.length = out->length;
151  fvec_copy(&tmp, out);
152#endif
153
154  return;
155}
156
157uint_t aubio_mfcc_set_power (aubio_mfcc_t *mf, smpl_t power)
158{
159  return aubio_filterbank_set_power(mf->fb, power);
160}
161
162uint_t aubio_mfcc_get_power (aubio_mfcc_t *mf)
163{
164  return aubio_filterbank_get_power(mf->fb);
165}
166
167uint_t aubio_mfcc_set_scale (aubio_mfcc_t *mf, smpl_t scale)
168{
169  mf->scale = scale;
170  return AUBIO_OK;
171}
172
173uint_t aubio_mfcc_get_scale (aubio_mfcc_t *mf)
174{
175  return mf->scale;
176}
177
178uint_t aubio_mfcc_set_mel_coeffs (aubio_mfcc_t *mf, smpl_t freq_min,
179    smpl_t freq_max)
180{
181  return aubio_filterbank_set_mel_coeffs(mf->fb, mf->samplerate,
182      freq_min, freq_max);
183}
184
185uint_t aubio_mfcc_set_mel_coeffs_htk (aubio_mfcc_t *mf, smpl_t freq_min,
186    smpl_t freq_max)
187{
188  return aubio_filterbank_set_mel_coeffs_htk(mf->fb, mf->samplerate,
189      freq_min, freq_max);
190}
191
192uint_t aubio_mfcc_set_mel_coeffs_slaney (aubio_mfcc_t *mf, smpl_t freq_min,
193    smpl_t freq_max)
194{
195  return aubio_filterbank_set_mel_coeffs_slaney (mf->fb, mf->samplerate);
196}
Note: See TracBrowser for help on using the repository browser.