source: src/pitch/pitch.c @ 5a2a6c6

Branches: feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since 5a2a6c6 was 5a2a6c6, checked in by Paul Brossier <piem@piem.org>, 10 years ago

src/pitch/pitch.c: add Hertz as valid unit string

  • Property mode set to 100644
File size: 12.9 KB
RevLine 
[96fb8ad]1/*
[e6a78ea]2  Copyright (C) 2003-2009 Paul Brossier <piem@aubio.org>
3
4  This file is part of aubio.
5
6  aubio is free software: you can redistribute it and/or modify
7  it under the terms of the GNU General Public License as published by
8  the Free Software Foundation, either version 3 of the License, or
9  (at your option) any later version.
10
11  aubio is distributed in the hope that it will be useful,
12  but WITHOUT ANY WARRANTY; without even the implied warranty of
13  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  GNU General Public License for more details.
15
16  You should have received a copy of the GNU General Public License
17  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
18
19*/
[96fb8ad]20
21#include "aubio_priv.h"
[6c7d49b]22#include "fvec.h"
23#include "cvec.h"
[a4364b8]24#include "lvec.h"
[96fb8ad]25#include "mathutils.h"
[83963b3]26#include "musicutils.h"
27#include "spectral/phasevoc.h"
[a695854]28#include "temporal/filter.h"
[c159aeb]29#include "temporal/c_weighting.h"
[2d8cffa]30#include "pitch/pitchmcomb.h"
31#include "pitch/pitchyin.h"
32#include "pitch/pitchfcomb.h"
33#include "pitch/pitchschmitt.h"
34#include "pitch/pitchyinfft.h"
[95dc7f2]35#include "pitch/pitchspecacf.h"
[ca1abdd]36#include "pitch/pitch.h"
[96fb8ad]37
/** silence threshold assigned to newly created pitch objects; parenthesized
 * so the leading minus sign cannot bind to neighbouring tokens */
#define DEFAULT_PITCH_SILENCE (-50.)
39
/** identifiers of the available pitch detection algorithms */
typedef enum
{
  /** `yin`, YIN algorithm */
  aubio_pitcht_yin,
  /** `mcomb`, Multi-comb filter */
  aubio_pitcht_mcomb,
  /** `schmitt`, Schmitt trigger */
  aubio_pitcht_schmitt,
  /** `fcomb`, Fast comb filter */
  aubio_pitcht_fcomb,
  /** `yinfft`, Spectral YIN */
  aubio_pitcht_yinfft,
  /** `specacf`, Spectral autocorrelation */
  aubio_pitcht_specacf,
  /** `default`, alias of `yinfft` */
  aubio_pitcht_default = aubio_pitcht_yinfft,
} aubio_pitch_type;
[fe163ad]52
/** units in which a detected pitch can be reported */
typedef enum
{
  /** Frequency (Hz) */
  aubio_pitchm_freq,
  /** MIDI note (0.,127) */
  aubio_pitchm_midi,
  /** Cent */
  aubio_pitchm_cent,
  /** Frequency bin (0,bufsize) */
  aubio_pitchm_bin,
  /** unit selected when "default" is requested, alias of the frequency mode */
  aubio_pitchm_default = aubio_pitchm_freq,
} aubio_pitch_mode;
[fe163ad]62
[b130600]63/** callback to get pitch candidate, defined below */
64typedef void (*aubio_pitch_detect_t) (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
[6d4ec49]65
[b130600]66/** callback to convert pitch from one unit to another, defined below */
67typedef smpl_t(*aubio_pitch_convert_t) (smpl_t value, uint_t samplerate, uint_t bufsize);
[5284e0d]68
[b130600]69/** callback to fetch the confidence of the algorithm */
70typedef smpl_t (*aubio_pitch_get_conf_t) (void * p);
[f44b111]71
[475da2f]72/** generic pitch detection structure */
[fddfa64]73struct _aubio_pitch_t
74{
[b130600]75  aubio_pitch_type type;          /**< pitch detection mode */
76  aubio_pitch_mode mode;          /**< pitch detection output mode */
77  uint_t samplerate;              /**< samplerate */
[475da2f]78  uint_t bufsize;                 /**< buffer size */
[b130600]79  void *p_object;                 /**< pointer to pitch object */
[fddfa64]80  aubio_filter_t *filter;         /**< filter */
81  aubio_pvoc_t *pv;               /**< phase vocoder for mcomb */
82  cvec_t *fftgrain;               /**< spectral frame for mcomb */
83  fvec_t *buf;                    /**< temporary buffer for yin */
[b130600]84  aubio_pitch_detect_t detect_cb; /**< callback to get the pitch candidates */
85  aubio_pitch_convert_t conv_cb;  /**< callback to convert it to the desired unit */
86  aubio_pitch_get_conf_t conf_cb; /**< pointer to the current confidence callback */
[8c3f717]87  smpl_t silence;                 /**< silence threshold */
[96fb8ad]88};
89
[b130600]90/* callback functions for pitch detection */
91static void aubio_pitch_do_mcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
92static void aubio_pitch_do_yin (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
93static void aubio_pitch_do_schmitt (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
94static void aubio_pitch_do_fcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
95static void aubio_pitch_do_yinfft (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
[95dc7f2]96static void aubio_pitch_do_specacf (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf);
[3ec9d9c]97
[b130600]98/* conversion functions for frequency conversions */
99smpl_t freqconvbin (smpl_t f, uint_t samplerate, uint_t bufsize);
100smpl_t freqconvmidi (smpl_t f, uint_t samplerate, uint_t bufsize);
101smpl_t freqconvpass (smpl_t f, uint_t samplerate, uint_t bufsize);
102
103/* adapter to stack ibuf new samples at the end of buf, and trim `buf` to `bufsize` */
104void aubio_pitch_slideblock (aubio_pitch_t * p, fvec_t * ibuf);
[3ec9d9c]105
106
[ca1abdd]107aubio_pitch_t *
108new_aubio_pitch (char_t * pitch_mode,
[168337e]109    uint_t bufsize, uint_t hopsize, uint_t samplerate)
[96fb8ad]110{
[fddfa64]111  aubio_pitch_t *p = AUBIO_NEW (aubio_pitch_t);
[ca1abdd]112  aubio_pitch_type pitch_type;
[fe163ad]113  if (strcmp (pitch_mode, "mcomb") == 0)
[fddfa64]114    pitch_type = aubio_pitcht_mcomb;
[fe163ad]115  else if (strcmp (pitch_mode, "yinfft") == 0)
[97a5878b]116    pitch_type = aubio_pitcht_yinfft;
[fe163ad]117  else if (strcmp (pitch_mode, "yin") == 0)
[fddfa64]118    pitch_type = aubio_pitcht_yin;
[fe163ad]119  else if (strcmp (pitch_mode, "schmitt") == 0)
[fddfa64]120    pitch_type = aubio_pitcht_schmitt;
[fe163ad]121  else if (strcmp (pitch_mode, "fcomb") == 0)
[fddfa64]122    pitch_type = aubio_pitcht_fcomb;
[95dc7f2]123  else if (strcmp (pitch_mode, "specacf") == 0)
124    pitch_type = aubio_pitcht_specacf;
[fe163ad]125  else if (strcmp (pitch_mode, "default") == 0)
[fddfa64]126    pitch_type = aubio_pitcht_default;
[fe163ad]127  else {
[fddfa64]128    AUBIO_ERR ("unknown pitch detection method %s, using default.\n",
129        pitch_mode);
130    pitch_type = aubio_pitcht_default;
[fe163ad]131  }
[b130600]132  p->samplerate = samplerate;
[fe163ad]133  p->type = pitch_type;
[ca1abdd]134  aubio_pitch_set_unit (p, "default");
[6d4ec49]135  p->bufsize = bufsize;
[8c3f717]136  p->silence = DEFAULT_PITCH_SILENCE;
[b130600]137  p->conf_cb = NULL;
[fddfa64]138  switch (p->type) {
[ca1abdd]139    case aubio_pitcht_yin:
[168337e]140      p->buf = new_fvec (bufsize);
[b130600]141      p->p_object = new_aubio_pitchyin (bufsize);
142      p->detect_cb = aubio_pitch_do_yin;
143      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchyin_get_confidence;
144      aubio_pitchyin_set_tolerance (p->p_object, 0.15);
[6d4ec49]145      break;
[ca1abdd]146    case aubio_pitcht_mcomb:
[168337e]147      p->pv = new_aubio_pvoc (bufsize, hopsize);
148      p->fftgrain = new_cvec (bufsize);
[b130600]149      p->p_object = new_aubio_pitchmcomb (bufsize, hopsize);
[168337e]150      p->filter = new_aubio_filter_c_weighting (samplerate);
[b130600]151      p->detect_cb = aubio_pitch_do_mcomb;
[6d4ec49]152      break;
[ca1abdd]153    case aubio_pitcht_fcomb:
[168337e]154      p->buf = new_fvec (bufsize);
[b130600]155      p->p_object = new_aubio_pitchfcomb (bufsize, hopsize);
156      p->detect_cb = aubio_pitch_do_fcomb;
[6d4ec49]157      break;
[ca1abdd]158    case aubio_pitcht_schmitt:
[168337e]159      p->buf = new_fvec (bufsize);
[b130600]160      p->p_object = new_aubio_pitchschmitt (bufsize);
161      p->detect_cb = aubio_pitch_do_schmitt;
[6d4ec49]162      break;
[ca1abdd]163    case aubio_pitcht_yinfft:
[168337e]164      p->buf = new_fvec (bufsize);
[9c9202f]165      p->p_object = new_aubio_pitchyinfft (samplerate, bufsize);
[b130600]166      p->detect_cb = aubio_pitch_do_yinfft;
167      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchyinfft_get_confidence;
168      aubio_pitchyinfft_set_tolerance (p->p_object, 0.85);
[6d4ec49]169      break;
[95dc7f2]170    case aubio_pitcht_specacf:
171      p->buf = new_fvec (bufsize);
172      p->p_object = new_aubio_pitchspecacf (bufsize);
173      p->detect_cb = aubio_pitch_do_specacf;
174      p->conf_cb = (aubio_pitch_get_conf_t)aubio_pitchspecacf_get_tolerance;
175      aubio_pitchspecacf_set_tolerance (p->p_object, 0.85);
176      break;
[6d4ec49]177    default:
178      break;
179  }
180  return p;
[96fb8ad]181}
182
[fddfa64]183void
184del_aubio_pitch (aubio_pitch_t * p)
185{
186  switch (p->type) {
[ca1abdd]187    case aubio_pitcht_yin:
[fddfa64]188      del_fvec (p->buf);
[b130600]189      del_aubio_pitchyin (p->p_object);
[6d4ec49]190      break;
[ca1abdd]191    case aubio_pitcht_mcomb:
[fddfa64]192      del_aubio_pvoc (p->pv);
193      del_cvec (p->fftgrain);
194      del_aubio_filter (p->filter);
[b130600]195      del_aubio_pitchmcomb (p->p_object);
[6d4ec49]196      break;
[ca1abdd]197    case aubio_pitcht_schmitt:
[fddfa64]198      del_fvec (p->buf);
[b130600]199      del_aubio_pitchschmitt (p->p_object);
[6d4ec49]200      break;
[ca1abdd]201    case aubio_pitcht_fcomb:
[fddfa64]202      del_fvec (p->buf);
[b130600]203      del_aubio_pitchfcomb (p->p_object);
[6d4ec49]204      break;
[ca1abdd]205    case aubio_pitcht_yinfft:
[fddfa64]206      del_fvec (p->buf);
[b130600]207      del_aubio_pitchyinfft (p->p_object);
[6d4ec49]208      break;
[95dc7f2]209    case aubio_pitcht_specacf:
210      del_fvec (p->buf);
211      del_aubio_pitchspecacf (p->p_object);
212      break;
[6d4ec49]213    default:
214      break;
215  }
[fddfa64]216  AUBIO_FREE (p);
[96fb8ad]217}
218
[fddfa64]219void
220aubio_pitch_slideblock (aubio_pitch_t * p, fvec_t * ibuf)
221{
[168337e]222  uint_t j = 0, overlap_size = 0;
[fddfa64]223  overlap_size = p->buf->length - ibuf->length;
[168337e]224  for (j = 0; j < overlap_size; j++) {
225    p->buf->data[j] = p->buf->data[j + ibuf->length];
[6d4ec49]226  }
[168337e]227  for (j = 0; j < ibuf->length; j++) {
228    p->buf->data[j + overlap_size] = ibuf->data[j];
[6d4ec49]229  }
[651b97e]230}
231
[fddfa64]232uint_t
233aubio_pitch_set_unit (aubio_pitch_t * p, char_t * pitch_unit)
234{
[21e2e6db]235  uint_t err = AUBIO_OK;
[ca1abdd]236  aubio_pitch_mode pitch_mode;
[fe163ad]237  if (strcmp (pitch_unit, "freq") == 0)
[fddfa64]238    pitch_mode = aubio_pitchm_freq;
[53d1497]239  else if (strcmp (pitch_unit, "hertz") == 0)
240    pitch_mode = aubio_pitchm_freq;
[5a2a6c6]241  else if (strcmp (pitch_unit, "Hertz") == 0)
242    pitch_mode = aubio_pitchm_freq;
[53d1497]243  else if (strcmp (pitch_unit, "Hz") == 0)
244    pitch_mode = aubio_pitchm_freq;
245  else if (strcmp (pitch_unit, "f0") == 0)
246    pitch_mode = aubio_pitchm_freq;
[fe163ad]247  else if (strcmp (pitch_unit, "midi") == 0)
[fddfa64]248    pitch_mode = aubio_pitchm_midi;
[fe163ad]249  else if (strcmp (pitch_unit, "cent") == 0)
[fddfa64]250    pitch_mode = aubio_pitchm_cent;
[fe163ad]251  else if (strcmp (pitch_unit, "bin") == 0)
[fddfa64]252    pitch_mode = aubio_pitchm_bin;
[fe163ad]253  else if (strcmp (pitch_unit, "default") == 0)
[fddfa64]254    pitch_mode = aubio_pitchm_default;
[fe163ad]255  else {
[fddfa64]256    AUBIO_ERR ("unknown pitch detection unit %s, using default\n", pitch_unit);
257    pitch_mode = aubio_pitchm_default;
[21e2e6db]258    err = AUBIO_FAIL;
[fe163ad]259  }
260  p->mode = pitch_mode;
[fddfa64]261  switch (p->mode) {
[fe163ad]262    case aubio_pitchm_freq:
[b130600]263      p->conv_cb = freqconvpass;
[fe163ad]264      break;
265    case aubio_pitchm_midi:
[b130600]266      p->conv_cb = freqconvmidi;
[fe163ad]267      break;
268    case aubio_pitchm_cent:
269      /* bug: not implemented */
[b130600]270      p->conv_cb = freqconvmidi;
[fe163ad]271      break;
272    case aubio_pitchm_bin:
[b130600]273      p->conv_cb = freqconvbin;
[fe163ad]274      break;
275    default:
276      break;
277  }
[21e2e6db]278  return err;
[fe163ad]279}
280
[fddfa64]281uint_t
282aubio_pitch_set_tolerance (aubio_pitch_t * p, smpl_t tol)
283{
284  switch (p->type) {
[ca1abdd]285    case aubio_pitcht_yin:
[b130600]286      aubio_pitchyin_set_tolerance (p->p_object, tol);
[7a6cbbe]287      break;
[ca1abdd]288    case aubio_pitcht_yinfft:
[b130600]289      aubio_pitchyinfft_set_tolerance (p->p_object, tol);
[7a6cbbe]290      break;
291    default:
292      break;
293  }
[93177fa]294  return AUBIO_OK;
[f8a38c5]295}
296
[8c3f717]297uint_t
298aubio_pitch_set_silence (aubio_pitch_t * p, smpl_t silence)
299{
300  if (silence < 0 && silence > -200) {
301    p->silence = silence;
302    return AUBIO_OK;
303  } else {
304    AUBIO_ERR("pitch: could do set silence to %.2f", silence);
305    return AUBIO_FAIL;
306  }
307}
308
309smpl_t
310aubio_pitch_get_silence (aubio_pitch_t * p)
311{
312  return p->silence;
313}
314
[b130600]315
316/* do method, calling the detection callback, then the conversion callback */
[fddfa64]317void
318aubio_pitch_do (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
319{
[b130600]320  p->detect_cb (p, ibuf, obuf);
[8c3f717]321  if (aubio_silence_detection(ibuf, p->silence) == 1) {
322    obuf->data[0] = 0.;
323  }
[b130600]324  obuf->data[0] = p->conv_cb (obuf->data[0], p->samplerate, p->bufsize);
[c078336]325}
326
[b130600]327/* do method for each algorithm */
[fddfa64]328void
329aubio_pitch_do_mcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
330{
331  aubio_filter_do (p->filter, ibuf);
332  aubio_pvoc_do (p->pv, ibuf, p->fftgrain);
[b130600]333  aubio_pitchmcomb_do (p->p_object, p->fftgrain, obuf);
334  obuf->data[0] = aubio_bintofreq (obuf->data[0], p->samplerate, p->bufsize);
[c078336]335}
336
[fddfa64]337void
338aubio_pitch_do_yin (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
339{
[6d4ec49]340  smpl_t pitch = 0.;
[fddfa64]341  aubio_pitch_slideblock (p, ibuf);
[b130600]342  aubio_pitchyin_do (p->p_object, p->buf, obuf);
[168337e]343  pitch = obuf->data[0];
344  if (pitch > 0) {
[b130600]345    pitch = p->samplerate / (pitch + 0.);
[168337e]346  } else {
347    pitch = 0.;
[6d4ec49]348  }
[168337e]349  obuf->data[0] = pitch;
[c078336]350}
351
352
[fddfa64]353void
354aubio_pitch_do_yinfft (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * obuf)
355{
[6d4ec49]356  smpl_t pitch = 0.;
[fddfa64]357  aubio_pitch_slideblock (p, ibuf);
[b130600]358  aubio_pitchyinfft_do (p->p_object, p->buf, obuf);
[168337e]359  pitch = obuf->data[0];
360  if (pitch > 0) {
[b130600]361    pitch = p->samplerate / (pitch + 0.);
[168337e]362  } else {
363    pitch = 0.;
[6d4ec49]364  }
[168337e]365  obuf->data[0] = pitch;
[650e39b]366}
367
[fddfa64]368void
[95dc7f2]369aubio_pitch_do_specacf (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
370{
[c21acb9]371  smpl_t pitch = 0., period;
[95dc7f2]372  aubio_pitch_slideblock (p, ibuf);
373  aubio_pitchspecacf_do (p->p_object, p->buf, out);
374  //out->data[0] = aubio_bintofreq (out->data[0], p->samplerate, p->bufsize);
[c21acb9]375  period = out->data[0];
[95dc7f2]376  if (period > 0) {
377    pitch = p->samplerate / period;
378  } else {
379    pitch = 0.;
380  }
381  out->data[0] = pitch;
382}
383
384void
[fddfa64]385aubio_pitch_do_fcomb (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
386{
387  aubio_pitch_slideblock (p, ibuf);
[b130600]388  aubio_pitchfcomb_do (p->p_object, p->buf, out);
389  out->data[0] = aubio_bintofreq (out->data[0], p->samplerate, p->bufsize);
[c078336]390}
391
[fddfa64]392void
393aubio_pitch_do_schmitt (aubio_pitch_t * p, fvec_t * ibuf, fvec_t * out)
394{
[7a6cbbe]395  smpl_t period, pitch = 0.;
[fddfa64]396  aubio_pitch_slideblock (p, ibuf);
[b130600]397  aubio_pitchschmitt_do (p->p_object, p->buf, out);
[168337e]398  period = out->data[0];
399  if (period > 0) {
[b130600]400    pitch = p->samplerate / period;
[168337e]401  } else {
402    pitch = 0.;
[7a6cbbe]403  }
[168337e]404  out->data[0] = pitch;
[96fb8ad]405}
[5284e0d]406
[b130600]407/* conversion callbacks */
408smpl_t
409freqconvbin(smpl_t f, uint_t samplerate, uint_t bufsize)
410{
411  return aubio_freqtobin(f, samplerate, bufsize);
412}
413
414smpl_t
415freqconvmidi (smpl_t f, uint_t samplerate UNUSED, uint_t bufsize UNUSED)
416{
417  return aubio_freqtomidi (f);
418}
419
420smpl_t
421freqconvpass (smpl_t f, uint_t samplerate UNUSED, uint_t bufsize UNUSED)
422{
423  return f;
424}
425
[5284e0d]426/* confidence callbacks */
427smpl_t
428aubio_pitch_get_confidence (aubio_pitch_t * p)
429{
[b130600]430  if (p->conf_cb) {
431    return p->conf_cb(p->p_object);
[5284e0d]432  }
433  return 0.;
434}
Note: See TracBrowser for help on using the repository browser.