source: src/pitch/pitch.c @ 52b5f34

feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since 52b5f34 was 8c3f717, checked in by Paul Brossier <piem@piem.org>, 12 years ago

src/pitch/pitch.{c,h}: add silence gate, default at -50dB

  • Property mode set to 100644
File size: 12.5 KB
Line 
1/*
2  Copyright (C) 2003-2009 Paul Brossier <piem@aubio.org>
3
4  This file is part of aubio.
5
6  aubio is free software: you can redistribute it and/or modify
7  it under the terms of the GNU General Public License as published by
8  the Free Software Foundation, either version 3 of the License, or
9  (at your option) any later version.
10
11  aubio is distributed in the hope that it will be useful,
12  but WITHOUT ANY WARRANTY; without even the implied warranty of
13  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  GNU General Public License for more details.
15
16  You should have received a copy of the GNU General Public License
17  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
18
19*/
20
21#include "aubio_priv.h"
22#include "fvec.h"
23#include "cvec.h"
24#include "lvec.h"
25#include "mathutils.h"
26#include "musicutils.h"
27#include "spectral/phasevoc.h"
28#include "temporal/filter.h"
29#include "temporal/c_weighting.h"
30#include "pitch/pitchmcomb.h"
31#include "pitch/pitchyin.h"
32#include "pitch/pitchfcomb.h"
33#include "pitch/pitchschmitt.h"
34#include "pitch/pitchyinfft.h"
35#include "pitch/pitchspecacf.h"
36#include "pitch/pitch.h"
37
/** default threshold of the silence gate (-50 dB), stored in each new pitch
 * object; parenthesized so the sign stays attached wherever it is expanded */
#define DEFAULT_PITCH_SILENCE (-50.)
39
/** identifiers of the available pitch detection algorithms; the quoted name
 * in each comment is the string accepted by new_aubio_pitch() */
typedef enum
{
  aubio_pitcht_yin = 0,      /**< `yin`, YIN algorithm */
  aubio_pitcht_mcomb = 1,    /**< `mcomb`, Multi-comb filter */
  aubio_pitcht_schmitt = 2,  /**< `schmitt`, Schmitt trigger */
  aubio_pitcht_fcomb = 3,    /**< `fcomb`, Fast comb filter */
  aubio_pitcht_yinfft = 4,   /**< `yinfft`, Spectral YIN */
  aubio_pitcht_specacf = 5,  /**< `specacf`, Spectral autocorrelation */
  /** `default`, alias of the spectral YIN algorithm */
  aubio_pitcht_default = aubio_pitcht_yinfft,
} aubio_pitch_type;
52
/** units in which a detected pitch can be reported */
typedef enum
{
  aubio_pitchm_freq = 0,  /**< Frequency (Hz) */
  aubio_pitchm_midi = 1,  /**< MIDI note (0.,127) */
  aubio_pitchm_cent = 2,  /**< Cent */
  aubio_pitchm_bin = 3,   /**< Frequency bin (0,bufsize) */
  /** unit selected when "default" is requested: frequency */
  aubio_pitchm_default = aubio_pitchm_freq,
} aubio_pitch_mode;
62
63/** callback to get pitch candidate, defined below */
64typedef void (*aubio_pitch_detect_t) (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
65
66/** callback to convert pitch from one unit to another, defined below */
67typedef smpl_t(*aubio_pitch_convert_t) (smpl_t value, uint_t samplerate, uint_t bufsize);
68
69/** callback to fetch the confidence of the algorithm */
70typedef smpl_t (*aubio_pitch_get_conf_t) (void * p);
71
72/** generic pitch detection structure */
73struct _aubio_pitch_t
74{
75  aubio_pitch_type type;          /**< pitch detection mode */
76  aubio_pitch_mode mode;          /**< pitch detection output mode */
77  uint_t samplerate;              /**< samplerate */
78  uint_t bufsize;                 /**< buffer size */
79  void *p_object;                 /**< pointer to pitch object */
80  aubio_filter_t *filter;         /**< filter */
81  aubio_pvoc_t *pv;               /**< phase vocoder for mcomb */
82  cvec_t *fftgrain;               /**< spectral frame for mcomb */
83  fvec_t *buf;                    /**< temporary buffer for yin */
84  aubio_pitch_detect_t detect_cb; /**< callback to get the pitch candidates */
85  aubio_pitch_convert_t conv_cb;  /**< callback to convert it to the desired unit */
86  aubio_pitch_get_conf_t conf_cb; /**< pointer to the current confidence callback */
87  smpl_t silence;                 /**< silence threshold */
88};
89
90/* callback functions for pitch detection */
91static void aubio_pitch_do_mcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
92static void aubio_pitch_do_yin (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
93static void aubio_pitch_do_schmitt (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
94static void aubio_pitch_do_fcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
95static void aubio_pitch_do_yinfft (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
96static void aubio_pitch_do_specacf (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
97
98/* conversion functions for frequency conversions */
99smpl_t freqconvbin (smpl_t f, uint_t samplerate, uint_t bufsize);
100smpl_t freqconvmidi (smpl_t f, uint_t samplerate, uint_t bufsize);
101smpl_t freqconvpass (smpl_t f, uint_t samplerate, uint_t bufsize);
102
103/* adapter to stack ibuf new samples at the end of buf, and trim `buf` to `bufsize` */
104void aubio_pitch_slideblock (aubio_pitch_t * p, fvec_t * ibuf);
105
106
107aubio_pitch_t *
108new_aubio_pitch (char_t * pitch_mode,
109    uint_t bufsize, uint_t hopsize, uint_t samplerate)
110{
111  aubio_pitch_t *p = AUBIO_NEW (aubio_pitch_t);
112  aubio_pitch_type pitch_type;
113  if (strcmp (pitch_mode, "mcomb") == 0)
114    pitch_type = aubio_pitcht_mcomb;
115  else if (strcmp (pitch_mode, "yinfft") == 0)
116    pitch_type = aubio_pitcht_yinfft;
117  else if (strcmp (pitch_mode, "yin") == 0)
118    pitch_type = aubio_pitcht_yin;
119  else if (strcmp (pitch_mode, "schmitt") == 0)
120    pitch_type = aubio_pitcht_schmitt;
121  else if (strcmp (pitch_mode, "fcomb") == 0)
122    pitch_type = aubio_pitcht_fcomb;
123  else if (strcmp (pitch_mode, "specacf") == 0)
124    pitch_type = aubio_pitcht_specacf;
125  else if (strcmp (pitch_mode, "default") == 0)
126    pitch_type = aubio_pitcht_default;
127  else {
128    AUBIO_ERR ("unknown pitch detection method %s, using default.\n",
129        pitch_mode);
130    pitch_type = aubio_pitcht_default;
131  }
132  p->samplerate = samplerate;
133  p->type = pitch_type;
134  aubio_pitch_set_unit (p, "default");
135  p->bufsize = bufsize;
136  p->silence = DEFAULT_PITCH_SILENCE;
137  p->conf_cb = NULL;
138  switch (p->type) {
139    case aubio_pitcht_yin:
140      p->buf = new_fvec (bufsize);
141      p->p_object = new_aubio_pitchyin (bufsize);
142      p->detect_cb = aubio_pitch_do_yin;
143      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchyin_get_confidence;
144      aubio_pitchyin_set_tolerance (p->p_object, 0.15);
145      break;
146    case aubio_pitcht_mcomb:
147      p->pv = new_aubio_pvoc (bufsize, hopsize);
148      p->fftgrain = new_cvec (bufsize);
149      p->p_object = new_aubio_pitchmcomb (bufsize, hopsize);
150      p->filter = new_aubio_filter_c_weighting (samplerate);
151      p->detect_cb = aubio_pitch_do_mcomb;
152      break;
153    case aubio_pitcht_fcomb:
154      p->buf = new_fvec (bufsize);
155      p->p_object = new_aubio_pitchfcomb (bufsize, hopsize);
156      p->detect_cb = aubio_pitch_do_fcomb;
157      break;
158    case aubio_pitcht_schmitt:
159      p->buf = new_fvec (bufsize);
160      p->p_object = new_aubio_pitchschmitt (bufsize);
161      p->detect_cb = aubio_pitch_do_schmitt;
162      break;
163    case aubio_pitcht_yinfft:
164      p->buf = new_fvec (bufsize);
165      p->p_object = new_aubio_pitchyinfft (samplerate, bufsize);
166      p->detect_cb = aubio_pitch_do_yinfft;
167      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchyinfft_get_confidence;
168      aubio_pitchyinfft_set_tolerance (p->p_object, 0.85);
169      break;
170    case aubio_pitcht_specacf:
171      p->buf = new_fvec (bufsize);
172      p->p_object = new_aubio_pitchspecacf (bufsize);
173      p->detect_cb = aubio_pitch_do_specacf;
174      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchspecacf_get_tolerance;
175      aubio_pitchspecacf_set_tolerance (p->p_object, 0.85);
176      break;
177    default:
178      break;
179  }
180  return p;
181}
182
183void
184del_aubio_pitch (aubio_pitch_t * p)
185{
186  switch (p->type) {
187    case aubio_pitcht_yin:
188      del_fvec (p->buf);
189      del_aubio_pitchyin (p->p_object);
190      break;
191    case aubio_pitcht_mcomb:
192      del_aubio_pvoc (p->pv);
193      del_cvec (p->fftgrain);
194      del_aubio_filter (p->filter);
195      del_aubio_pitchmcomb (p->p_object);
196      break;
197    case aubio_pitcht_schmitt:
198      del_fvec (p->buf);
199      del_aubio_pitchschmitt (p->p_object);
200      break;
201    case aubio_pitcht_fcomb:
202      del_fvec (p->buf);
203      del_aubio_pitchfcomb (p->p_object);
204      break;
205    case aubio_pitcht_yinfft:
206      del_fvec (p->buf);
207      del_aubio_pitchyinfft (p->p_object);
208      break;
209    case aubio_pitcht_specacf:
210      del_fvec (p->buf);
211      del_aubio_pitchspecacf (p->p_object);
212      break;
213    default:
214      break;
215  }
216  AUBIO_FREE (p);
217}
218
219void
220aubio_pitch_slideblock (aubio_pitch_t * p, fvec_t * ibuf)
221{
222  uint_t j = 0, overlap_size = 0;
223  overlap_size = p->buf->length - ibuf->length;
224  for (j = 0; j < overlap_size; j++) {
225    p->buf->data[j] = p->buf->data[j + ibuf->length];
226  }
227  for (j = 0; j < ibuf->length; j++) {
228    p->buf->data[j + overlap_size] = ibuf->data[j];
229  }
230}
231
232uint_t
233aubio_pitch_set_unit (aubio_pitch_t * p, char_t * pitch_unit)
234{
235  aubio_pitch_mode pitch_mode;
236  if (strcmp (pitch_unit, "freq") == 0)
237    pitch_mode = aubio_pitchm_freq;
238  else if (strcmp (pitch_unit, "midi") == 0)
239    pitch_mode = aubio_pitchm_midi;
240  else if (strcmp (pitch_unit, "cent") == 0)
241    pitch_mode = aubio_pitchm_cent;
242  else if (strcmp (pitch_unit, "bin") == 0)
243    pitch_mode = aubio_pitchm_bin;
244  else if (strcmp (pitch_unit, "default") == 0)
245    pitch_mode = aubio_pitchm_default;
246  else {
247    AUBIO_ERR ("unknown pitch detection unit %s, using default\n", pitch_unit);
248    pitch_mode = aubio_pitchm_default;
249  }
250  p->mode = pitch_mode;
251  switch (p->mode) {
252    case aubio_pitchm_freq:
253      p->conv_cb = freqconvpass;
254      break;
255    case aubio_pitchm_midi:
256      p->conv_cb = freqconvmidi;
257      break;
258    case aubio_pitchm_cent:
259      /* bug: not implemented */
260      p->conv_cb = freqconvmidi;
261      break;
262    case aubio_pitchm_bin:
263      p->conv_cb = freqconvbin;
264      break;
265    default:
266      break;
267  }
268  return AUBIO_OK;
269}
270
271uint_t
272aubio_pitch_set_tolerance (aubio_pitch_t * p, smpl_t tol)
273{
274  switch (p->type) {
275    case aubio_pitcht_yin:
276      aubio_pitchyin_set_tolerance (p->p_object, tol);
277      break;
278    case aubio_pitcht_yinfft:
279      aubio_pitchyinfft_set_tolerance (p->p_object, tol);
280      break;
281    default:
282      break;
283  }
284  return AUBIO_OK;
285}
286
287uint_t
288aubio_pitch_set_silence (aubio_pitch_t * p, smpl_t silence)
289{
290  if (silence < 0 && silence > -200) {
291    p->silence = silence;
292    return AUBIO_OK;
293  } else {
294    AUBIO_ERR("pitch: could do set silence to %.2f", silence);
295    return AUBIO_FAIL;
296  }
297}
298
299smpl_t
300aubio_pitch_get_silence (aubio_pitch_t * p)
301{
302  return p->silence;
303}
304
305
306/* do method, calling the detection callback, then the conversion callback */
307void
308aubio_pitch_do (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
309{
310  p->detect_cb (p, ibuf, obuf);
311  if (aubio_silence_detection(ibuf, p->silence) == 1) {
312    obuf->data[0] = 0.;
313  }
314  obuf->data[0] = p->conv_cb (obuf->data[0], p->samplerate, p->bufsize);
315}
316
317/* do method for each algorithm */
318void
319aubio_pitch_do_mcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
320{
321  aubio_filter_do (p->filter, ibuf);
322  aubio_pvoc_do (p->pv, ibuf, p->fftgrain);
323  aubio_pitchmcomb_do (p->p_object, p->fftgrain, obuf);
324  obuf->data[0] = aubio_bintofreq (obuf->data[0], p->samplerate, p->bufsize);
325}
326
327void
328aubio_pitch_do_yin (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
329{
330  smpl_t pitch = 0.;
331  aubio_pitch_slideblock (p, ibuf);
332  aubio_pitchyin_do (p->p_object, p->buf, obuf);
333  pitch = obuf->data[0];
334  if (pitch > 0) {
335    pitch = p->samplerate / (pitch + 0.);
336  } else {
337    pitch = 0.;
338  }
339  obuf->data[0] = pitch;
340}
341
342
343void
344aubio_pitch_do_yinfft (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
345{
346  smpl_t pitch = 0.;
347  aubio_pitch_slideblock (p, ibuf);
348  aubio_pitchyinfft_do (p->p_object, p->buf, obuf);
349  pitch = obuf->data[0];
350  if (pitch > 0) {
351    pitch = p->samplerate / (pitch + 0.);
352  } else {
353    pitch = 0.;
354  }
355  obuf->data[0] = pitch;
356}
357
358void
359aubio_pitch_do_specacf (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
360{
361  aubio_pitch_slideblock (p, ibuf);
362  aubio_pitchspecacf_do (p->p_object, p->buf, out);
363  //out->data[0] = aubio_bintofreq (out->data[0], p->samplerate, p->bufsize);
364  smpl_t pitch = 0., period = out->data[0];
365  if (period > 0) {
366    pitch = p->samplerate / period;
367  } else {
368    pitch = 0.;
369  }
370  out->data[0] = pitch;
371}
372
373void
374aubio_pitch_do_fcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
375{
376  aubio_pitch_slideblock (p, ibuf);
377  aubio_pitchfcomb_do (p->p_object, p->buf, out);
378  out->data[0] = aubio_bintofreq (out->data[0], p->samplerate, p->bufsize);
379}
380
381void
382aubio_pitch_do_schmitt (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
383{
384  smpl_t period, pitch = 0.;
385  aubio_pitch_slideblock (p, ibuf);
386  aubio_pitchschmitt_do (p->p_object, p->buf, out);
387  period = out->data[0];
388  if (period > 0) {
389    pitch = p->samplerate / period;
390  } else {
391    pitch = 0.;
392  }
393  out->data[0] = pitch;
394}
395
396/* conversion callbacks */
397smpl_t
398freqconvbin(smpl_t f, uint_t samplerate, uint_t bufsize)
399{
400  return aubio_freqtobin(f, samplerate, bufsize);
401}
402
403smpl_t
404freqconvmidi (smpl_t f, uint_t samplerate UNUSED, uint_t bufsize UNUSED)
405{
406  return aubio_freqtomidi (f);
407}
408
409smpl_t
410freqconvpass (smpl_t f, uint_t samplerate UNUSED, uint_t bufsize UNUSED)
411{
412  return f;
413}
414
415/* confidence callbacks */
416smpl_t
417aubio_pitch_get_confidence (aubio_pitch_t * p)
418{
419  if (p->conf_cb) {
420    return p->conf_cb(p->p_object);
421  }
422  return 0.;
423}
Note: See TracBrowser for help on using the repository browser.