source: src/pitch/pitchmcomb.c @ 36b5f94

feature/autosink, feature/cnn, feature/cnn_org, feature/constantq, feature/crepe, feature/crepe_org, feature/pitchshift, feature/pydocstrings, feature/timestretch, fix/ffmpeg5, pitchshift, sampler, timestretch, yinfft+
Last change on this file since 36b5f94 was fddfa64, checked in by Paul Brossier <piem@piem.org>, 15 years ago

src/pitch/: indent

  • Property mode set to 100644
File size: 14.6 KB
RevLine 
[96fb8ad]1/*
[e6a78ea]2  Copyright (C) 2003-2009 Paul Brossier <piem@aubio.org>
[96fb8ad]3
[e6a78ea]4  This file is part of aubio.
[96fb8ad]5
[e6a78ea]6  aubio is free software: you can redistribute it and/or modify
7  it under the terms of the GNU General Public License as published by
8  the Free Software Foundation, either version 3 of the License, or
9  (at your option) any later version.
[96fb8ad]10
[e6a78ea]11  aubio is distributed in the hope that it will be useful,
12  but WITHOUT ANY WARRANTY; without even the implied warranty of
13  MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
14  GNU General Public License for more details.
15
16  You should have received a copy of the GNU General Public License
17  along with aubio.  If not, see <http://www.gnu.org/licenses/>.
[96fb8ad]18
19*/
20
21#include "aubio_priv.h"
[6c7d49b]22#include "fvec.h"
23#include "cvec.h"
[96fb8ad]24#include "mathutils.h"
[2d8cffa]25#include "pitch/pitchmcomb.h"
[96fb8ad]26
/** swap two candidate pointers in place
 *
 * `a` and `b` must be modifiable lvalues of type aubio_spectralcandidate_t *;
 * each argument is evaluated twice. The body is wrapped in do { } while (0)
 * so that `CAND_SWAP (x, y);` is a single statement, safe in an unbraced
 * if / else.
 */
#define CAND_SWAP(a,b) do { \
    aubio_spectralcandidate_t *cand_swap_tmp = (a); \
    (a) = (b); \
    (b) = cand_swap_tmp; \
  } while (0)
28
29typedef struct _aubio_spectralpeak_t aubio_spectralpeak_t;
30typedef struct _aubio_spectralcandidate_t aubio_spectralcandidate_t;
[fddfa64]31uint_t aubio_pitchmcomb_get_root_peak (aubio_spectralpeak_t * peaks,
32    uint_t length);
33uint_t aubio_pitchmcomb_quadpick (aubio_spectralpeak_t * spectral_peaks,
34    fvec_t * X);
35void aubio_pitchmcomb_spectral_pp (aubio_pitchmcomb_t * p, fvec_t * oldmag);
36void aubio_pitchmcomb_combdet (aubio_pitchmcomb_t * p, fvec_t * newmag);
[96fb8ad]37/* not used but useful : sort by amplitudes (or anything else)
38 * sort_pitchpeak(peaks, length);
39 */
40/** spectral_peak comparison function (must return signed int) */
[fddfa64]41static sint_t aubio_pitchmcomb_sort_peak_comp (const void *x, const void *y);
[96fb8ad]42/** sort spectral_peak against their mag */
[fddfa64]43void aubio_pitchmcomb_sort_peak (aubio_spectralpeak_t * peaks, uint_t nbins);
[9a12264]44/** select the best candidates */
[fddfa64]45uint_t aubio_pitch_cands (aubio_pitchmcomb_t * p, cvec_t * fftgrain,
46    smpl_t * cands);
[96fb8ad]47
48/** sort spectral_candidate against their comb ene */
[fddfa64]49void aubio_pitchmcomb_sort_cand_ene (aubio_spectralcandidate_t ** candidates,
50    uint_t nbins);
[96fb8ad]51/** sort spectral_candidate against their frequency */
[fddfa64]52void aubio_pitchmcomb_sort_cand_freq (aubio_spectralcandidate_t ** candidates,
53    uint_t nbins);
[96fb8ad]54
[fddfa64]55struct _aubio_pitchmcomb_t
56{
[96fb8ad]57  smpl_t threshold;                        /**< offset threshold [0.033 or 0.01]     */
58  smpl_t alpha;                            /**< normalisation exponent [9]           */
59  smpl_t cutoff;                           /**< low-pass filter cutoff [0.34, 1]     */
60  smpl_t tol;                              /**< tolerance [0.05]                     */
[e5757cf]61  // smpl_t tau;                              /**< frequency precision [44100/4096]     */
[96fb8ad]62  uint_t win_post;                         /**< median filter window length          */
63  uint_t win_pre;                          /**< median filter window                 */
64  uint_t ncand;                            /**< maximum number of candidates (combs) */
65  uint_t npartials;                        /**< maximum number of partials per combs */
66  uint_t count;                            /**< picked picks                         */
67  uint_t goodcandidate;                    /**< best candidate                       */
68  uint_t spec_partition;                   /**< spectrum partition to consider       */
[fddfa64]69  aubio_spectralpeak_t *peaks;             /**< up to length win/spec_partition      */
70  aubio_spectralcandidate_t **candidates;  /** up to five candidates                 */
[96fb8ad]71  /* some scratch pads */
72  /** \bug  (unnecessary copied from fftgrain?) */
[fddfa64]73  fvec_t *newmag;                          /**< vec to store mag                     */
74  fvec_t *scratch;                         /**< vec to store modified mag            */
75  fvec_t *scratch2;                        /**< vec to compute moving median         */
76  fvec_t *theta;                          /**< vec to store phase                     */
[d94f98b]77  smpl_t phasediff;
78  smpl_t phasefreq;
[96fb8ad]79  /** threshfn: name or handle of fn for computing adaptive threshold [median] */
80  /** aubio_thresholdfn_t thresholdfn; */
81  /** picker: name or handle of fn for picking event times [quadpick] */
82  /** aubio_pickerfn_t pickerfn; */
83};
84
85/** spectral peak object */
[fddfa64]86struct _aubio_spectralpeak_t
87{
[96fb8ad]88  uint_t bin;     /**< bin [0-(length-1)] */
89  smpl_t ebin;    /**< estimated bin */
90  smpl_t mag;     /**< peak magnitude */
91};
92
93/** spectral candidates array object */
[fddfa64]94struct _aubio_spectralcandidate_t
95{
[96fb8ad]96  smpl_t ebin;    /**< interpolated bin */
[fddfa64]97  smpl_t *ecomb;  /**< comb */
[96fb8ad]98  smpl_t ene;     /**< candidate energy */
99  smpl_t len;     /**< length */
100};
101
102
[fddfa64]103void
104aubio_pitchmcomb_do (aubio_pitchmcomb_t * p, cvec_t * fftgrain, fvec_t * output)
105{
106  uint_t i, j;
[d94f98b]107  smpl_t instfreq;
[fddfa64]108  fvec_t *newmag = (fvec_t *) p->newmag;
[96fb8ad]109  //smpl_t hfc; //fe=instfreq(theta1,theta,ops); //theta1=theta;
110  /* copy incoming grain to newmag */
[fddfa64]111  for (i = 0; i < fftgrain->channels; i++) {
112    for (j = 0; j < newmag->length; j++)
113      newmag->data[0][j] = fftgrain->norm[i][j];
114    /* detect only if local energy > 10. */
115    //if (fvec_local_energy(newmag)>10.) {
[5c4ec3c]116    //hfc = fvec_local_hfc(newmag); //not used
[fddfa64]117    aubio_pitchmcomb_spectral_pp (p, newmag);
118    aubio_pitchmcomb_combdet (p, newmag);
[d8604ac]119    //aubio_pitchmcomb_sort_cand_freq(p->candidates,p->ncand);
[d94f98b]120    //return p->candidates[p->goodcandidate]->ebin;
[fddfa64]121    j = (uint_t) FLOOR (p->candidates[p->goodcandidate]->ebin + .5);
122    instfreq = aubio_unwrap2pi (fftgrain->phas[i][j]
123        - p->theta->data[i][j] - j * p->phasediff);
124    instfreq *= p->phasefreq;
125    /* store phase for next run */
126    for (j = 0; j < p->theta->length; j++) {
127      p->theta->data[i][j] = fftgrain->phas[i][j];
128    }
129    //return p->candidates[p->goodcandidate]->ebin;
130    output->data[i][0] =
131        FLOOR (p->candidates[p->goodcandidate]->ebin + .5) + instfreq;
132    /*} else {
133       return -1.;
134       } */
[e5757cf]135  }
[96fb8ad]136}
137
[fddfa64]138uint_t
139aubio_pitch_cands (aubio_pitchmcomb_t * p, cvec_t * fftgrain, smpl_t * cands)
140{
141  uint_t i = 0, j;
[96fb8ad]142  uint_t k;
[fddfa64]143  fvec_t *newmag = (fvec_t *) p->newmag;
144  aubio_spectralcandidate_t **scands =
145      (aubio_spectralcandidate_t **) (p->candidates);
[96fb8ad]146  //smpl_t hfc; //fe=instfreq(theta1,theta,ops); //theta1=theta;
147  /* copy incoming grain to newmag */
[fddfa64]148  for (j = 0; j < newmag->length; j++)
149    newmag->data[i][j] = fftgrain->norm[i][j];
[b050e8e]150  /* detect only if local energy > 10. */
[fddfa64]151  if (fvec_local_energy (newmag) > 10.) {
[5c4ec3c]152    /* hfc = fvec_local_hfc(newmag); do not use */
[fddfa64]153    aubio_pitchmcomb_spectral_pp (p, newmag);
154    aubio_pitchmcomb_combdet (p, newmag);
155    aubio_pitchmcomb_sort_cand_freq (scands, p->ncand);
[b050e8e]156    /* store ncand comb energies in cands[1:ncand] */
[fddfa64]157    for (k = 0; k < p->ncand; k++)
[96fb8ad]158      cands[k] = p->candidates[k]->ene;
[b050e8e]159    /* store ncand[end] freq in cands[end] */
[fddfa64]160    cands[p->ncand] = p->candidates[p->ncand - 1]->ebin;
[96fb8ad]161    return 1;
162  } else {
[fddfa64]163    for (k = 0; k < p->ncand; k++)
[96fb8ad]164      cands[k] = 0;
165    return 0;
166  }
167}
168
[fddfa64]169void
170aubio_pitchmcomb_spectral_pp (aubio_pitchmcomb_t * p, fvec_t * newmag)
171{
172  fvec_t *mag = (fvec_t *) p->scratch;
173  fvec_t *tmp = (fvec_t *) p->scratch2;
174  uint_t i = 0, j;
[96fb8ad]175  uint_t length = mag->length;
176  /* copy newmag to mag (scracth) */
[fddfa64]177  for (j = 0; j < length; j++) {
[b050e8e]178    mag->data[i][j] = newmag->data[i][j];
[96fb8ad]179  }
[fddfa64]180  fvec_min_removal (mag);       /* min removal          */
181  fvec_alpha_normalise (mag, p->alpha); /* alpha normalisation  */
182  /* skipped *//* low pass filtering   */
[5c4ec3c]183  /** \bug fvec_moving_thres may write out of bounds */
[fddfa64]184  fvec_adapt_thres (mag, tmp, p->win_post, p->win_pre, i);      /* adaptative threshold */
185  fvec_add (mag, -p->threshold);        /* fixed threshold      */
[96fb8ad]186  {
[fddfa64]187    aubio_spectralpeak_t *peaks = (aubio_spectralpeak_t *) p->peaks;
[96fb8ad]188    uint_t count;
189    /*  return bin and ebin */
[fddfa64]190    count = aubio_pitchmcomb_quadpick (peaks, mag);
191    for (j = 0; j < count; j++)
[96fb8ad]192      peaks[j].mag = newmag->data[i][peaks[j].bin];
193    /* reset non peaks */
[fddfa64]194    for (j = count; j < length; j++)
[96fb8ad]195      peaks[j].mag = 0.;
196    p->peaks = peaks;
197    p->count = count;
198  }
199}
200
[fddfa64]201void
202aubio_pitchmcomb_combdet (aubio_pitchmcomb_t * p, fvec_t * newmag)
203{
204  aubio_spectralpeak_t *peaks = (aubio_spectralpeak_t *) p->peaks;
205  aubio_spectralcandidate_t **candidate =
206      (aubio_spectralcandidate_t **) p->candidates;
[96fb8ad]207
208  /* parms */
[fddfa64]209  uint_t N = p->npartials;      /* maximum number of partials to be considered 10 */
210  uint_t M = p->ncand;          /* maximum number of combs to be considered 5 */
[96fb8ad]211  uint_t length = newmag->length;
212  uint_t count = p->count;
213  uint_t k;
214  uint_t l;
215  uint_t d;
[9638f84]216  uint_t curlen = 0;
[96fb8ad]217
218  smpl_t delta2;
219  smpl_t xx;
220  uint_t position = 0;
221
222  uint_t root_peak = 0;
223  uint_t tmpl = 0;
224  smpl_t tmpene = 0.;
225
226  /* get the biggest peak in the spectrum */
[fddfa64]227  root_peak = aubio_pitchmcomb_get_root_peak (peaks, count);
[e47ade3]228  /* not enough partials in highest notes, could be forced */
229  //if (peaks[root_peak].ebin >= aubio_miditofreq(85.)/p->tau) N=2;
230  //if (peaks[root_peak].ebin >= aubio_miditofreq(90.)/p->tau) N=1;
[96fb8ad]231  /* now calculate the energy of each of the 5 combs */
[fddfa64]232  for (l = 0; l < M; l++) {
233    smpl_t scaler = (1. / (l + 1.));
234    candidate[l]->ene = 0.;     /* reset ene and len sums */
[96fb8ad]235    candidate[l]->len = 0.;
[fddfa64]236    candidate[l]->ebin = scaler * peaks[root_peak].ebin;
[96fb8ad]237    /* if less than N peaks available, curlen < N */
[9638f84]238    if (candidate[l]->ebin != 0.)
[fddfa64]239      curlen = (uint_t) FLOOR (length / (candidate[l]->ebin));
240    curlen = (N < curlen) ? N : curlen;
[96fb8ad]241    /* fill candidate[l]->ecomb[k] with (k+1)*candidate[l]->ebin */
[fddfa64]242    for (k = 0; k < curlen; k++)
243      candidate[l]->ecomb[k] = (candidate[l]->ebin) * (k + 1.);
244    for (k = curlen; k < length; k++)
245      candidate[l]->ecomb[k] = 0.;
[96fb8ad]246    /* for each in candidate[l]->ecomb[k] */
[fddfa64]247    for (k = 0; k < curlen; k++) {
[d8604ac]248      xx = 100000.;
[b050e8e]249      /** get the candidate->ecomb the closer to peaks.ebin
[96fb8ad]250       * (to cope with the inharmonicity)*/
[fddfa64]251      for (d = 0; d < count; d++) {
252        delta2 = ABS (candidate[l]->ecomb[k] - peaks[d].ebin);
[96fb8ad]253        if (delta2 <= xx) {
254          position = d;
255          xx = delta2;
256        }
257      }
[b050e8e]258      /* for a Q factor of 17, maintaining "constant Q filtering",
[96fb8ad]259       * and sum energy and length over non null combs */
[fddfa64]260      if (17. * xx < candidate[l]->ecomb[k]) {
261        candidate[l]->ecomb[k] = peaks[position].ebin;
262        candidate[l]->ene +=    /* ecomb rounded to nearest int */
263            POW (newmag->data[0][(uint_t) FLOOR (candidate[l]->ecomb[k] + .5)],
264            0.25);
265        candidate[l]->len += 1. / curlen;
[96fb8ad]266      } else
[fddfa64]267        candidate[l]->ecomb[k] = 0.;
[96fb8ad]268    }
269    /* punishment */
[d94f98b]270    /*if (candidate[l]->len<0.6)
[fddfa64]271       candidate[l]->ene=0.; */
[d94f98b]272    /* remember best candidate energy (in polyphonic, could check for
273     * tmpene*1.1 < candidate->ene to reduce jumps towards low frequencies) */
274    if (tmpene < candidate[l]->ene) {
[96fb8ad]275      tmpl = l;
276      tmpene = candidate[l]->ene;
277    }
278  }
279  //p->candidates=candidate;
280  //p->peaks=peaks;
281  p->goodcandidate = tmpl;
282}
283
284/** T=quadpick(X): return indices of elements of X which are peaks and positive
285 * exact peak positions are retrieved by quadratic interpolation
286 *
[b050e8e]287 * \bug peak-picking too picky, sometimes counts too many peaks ?
[96fb8ad]288 */
[fddfa64]289uint_t
290aubio_pitchmcomb_quadpick (aubio_spectralpeak_t * spectral_peaks, fvec_t * X)
291{
[96fb8ad]292  uint_t i, j, ispeak, count = 0;
[fddfa64]293  for (i = 0; i < X->channels; i++)
294    for (j = 1; j < X->length - 1; j++) {
295      ispeak = fvec_peakpick (X, j);
[96fb8ad]296      if (ispeak) {
297        count += ispeak;
[fddfa64]298        spectral_peaks[count - 1].bin = j;
299        spectral_peaks[count - 1].ebin = fvec_quadint (X, j, i) - 1.;
[96fb8ad]300      }
301    }
302  return count;
303}
304
305/* get predominant partial */
[fddfa64]306uint_t
307aubio_pitchmcomb_get_root_peak (aubio_spectralpeak_t * peaks, uint_t length)
308{
309  uint_t i, pos = 0;
[96fb8ad]310  smpl_t tmp = 0.;
[fddfa64]311  for (i = 0; i < length; i++)
[96fb8ad]312    if (tmp <= peaks[i].mag) {
313      pos = i;
314      tmp = peaks[i].mag;
315    }
316  return pos;
317}
318
[fddfa64]319void
320aubio_pitchmcomb_sort_peak (aubio_spectralpeak_t * peaks, uint_t nbins)
321{
322  qsort (peaks, nbins, sizeof (aubio_spectralpeak_t),
[96fb8ad]323      aubio_pitchmcomb_sort_peak_comp);
324}
[fddfa64]325
326static sint_t
327aubio_pitchmcomb_sort_peak_comp (const void *x, const void *y)
328{
329  return (((aubio_spectralpeak_t *) y)->mag -
330      ((aubio_spectralpeak_t *) x)->mag);
[96fb8ad]331}
332
333
[fddfa64]334void
335aubio_pitchmcomb_sort_cand_ene (aubio_spectralcandidate_t ** candidates,
336    uint_t nbins)
337{
[96fb8ad]338  uint_t cur = 0;
339  uint_t run = 0;
[fddfa64]340  for (cur = 0; cur < nbins; cur++) {
[96fb8ad]341    run = cur + 1;
[fddfa64]342    for (run = cur; run < nbins; run++) {
343      if (candidates[run]->ene > candidates[cur]->ene)
344        CAND_SWAP (candidates[run], candidates[cur]);
[96fb8ad]345    }
346  }
347}
348
349
[fddfa64]350void
351aubio_pitchmcomb_sort_cand_freq (aubio_spectralcandidate_t ** candidates,
352    uint_t nbins)
353{
[96fb8ad]354  uint_t cur = 0;
355  uint_t run = 0;
[fddfa64]356  for (cur = 0; cur < nbins; cur++) {
[96fb8ad]357    run = cur + 1;
[fddfa64]358    for (run = cur; run < nbins; run++) {
359      if (candidates[run]->ebin < candidates[cur]->ebin)
360        CAND_SWAP (candidates[run], candidates[cur]);
[96fb8ad]361    }
362  }
363}
364
[fddfa64]365aubio_pitchmcomb_t *
366new_aubio_pitchmcomb (uint_t bufsize, uint_t hopsize, uint_t channels)
367{
368  aubio_pitchmcomb_t *p = AUBIO_NEW (aubio_pitchmcomb_t);
[7f3ccc5e]369  /* bug: should check if size / 8 > post+pre+1 */
[9638f84]370  uint_t i, j;
[96fb8ad]371  uint_t spec_size;
[fddfa64]372  p->spec_partition = 4;
373  p->ncand = 5;
374  p->npartials = 5;
375  p->cutoff = 1.;
376  p->threshold = 0.01;
377  p->win_post = 8;
378  p->win_pre = 7;
[e5757cf]379  // p->tau              = samplerate/bufsize;
[fddfa64]380  p->alpha = 9.;
381  p->goodcandidate = 0;
382  p->phasefreq = bufsize / hopsize / TWO_PI;
383  p->phasediff = TWO_PI * hopsize / bufsize;
384  spec_size = bufsize / p->spec_partition;
[96fb8ad]385  //p->pickerfn = quadpick;
386  //p->biquad = new_biquad(0.1600,0.3200,0.1600, -0.5949, 0.2348);
387  /* allocate temp memory */
[fddfa64]388  p->newmag = new_fvec (spec_size, 1);
[96fb8ad]389  /* array for median */
[fddfa64]390  p->scratch = new_fvec (spec_size, 1);
[d94f98b]391  /* array for phase */
[fddfa64]392  p->theta = new_fvec (spec_size, channels);
[96fb8ad]393  /* array for adaptative threshold */
[fddfa64]394  p->scratch2 = new_fvec (p->win_post + p->win_pre + 1, 1);
[96fb8ad]395  /* array of spectral peaks */
[fddfa64]396  p->peaks = AUBIO_ARRAY (aubio_spectralpeak_t, spec_size);
[9638f84]397  for (i = 0; i < spec_size; i++) {
398    p->peaks[i].bin = 0.;
399    p->peaks[i].ebin = 0.;
400    p->peaks[i].mag = 0.;
401  }
[96fb8ad]402  /* array of pointers to spectral candidates */
[fddfa64]403  p->candidates = AUBIO_ARRAY (aubio_spectralcandidate_t *, p->ncand);
404  for (i = 0; i < p->ncand; i++) {
405    p->candidates[i] = AUBIO_NEW (aubio_spectralcandidate_t);
406    p->candidates[i]->ecomb = AUBIO_ARRAY (smpl_t, spec_size);
407    for (j = 0; j < spec_size; j++) {
[9638f84]408      p->candidates[i]->ecomb[j] = 0.;
409    }
410    p->candidates[i]->ene = 0.;
411    p->candidates[i]->ebin = 0.;
412    p->candidates[i]->len = 0.;
[96fb8ad]413  }
414  return p;
415}
416
[7a04950]417
[fddfa64]418void
419del_aubio_pitchmcomb (aubio_pitchmcomb_t * p)
420{
[7a04950]421  uint_t i;
[fddfa64]422  del_fvec (p->newmag);
423  del_fvec (p->scratch);
424  del_fvec (p->theta);
425  del_fvec (p->scratch2);
426  AUBIO_FREE (p->peaks);
427  for (i = 0; i < p->ncand; i++) {
428    AUBIO_FREE (p->candidates[i]->ecomb);
429    AUBIO_FREE (p->candidates[i]);
[7a04950]430  }
[fddfa64]431  AUBIO_FREE (p->candidates);
432  AUBIO_FREE (p);
[7a04950]433}
Note: See TracBrowser for help on using the repository browser.