[7524d0b] | 1 | /* |
---|
[df53936] | 2 | Copyright (C) 2006-2013 Paul Brossier <piem@aubio.org> |
---|
[7524d0b] | 3 | |
---|
[e6a78ea] | 4 | This file is part of aubio. |
---|
[7524d0b] | 5 | |
---|
[e6a78ea] | 6 | aubio is free software: you can redistribute it and/or modify |
---|
| 7 | it under the terms of the GNU General Public License as published by |
---|
| 8 | the Free Software Foundation, either version 3 of the License, or |
---|
| 9 | (at your option) any later version. |
---|
[7524d0b] | 10 | |
---|
[e6a78ea] | 11 | aubio is distributed in the hope that it will be useful, |
---|
| 12 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
| 13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
---|
| 14 | GNU General Public License for more details. |
---|
| 15 | |
---|
| 16 | You should have received a copy of the GNU General Public License |
---|
| 17 | along with aubio. If not, see <http://www.gnu.org/licenses/>. |
---|
[7524d0b] | 18 | |
---|
| 19 | */ |
---|
| 20 | |
---|
| 21 | #include "aubio_priv.h" |
---|
[6c7d49b] | 22 | #include "fvec.h" |
---|
| 23 | #include "cvec.h" |
---|
[31907fd] | 24 | #include "spectral/specdesc.h" |
---|
[32d6958] | 25 | #include "spectral/phasevoc.h" |
---|
[9f060d1] | 26 | #include "spectral/awhitening.h" |
---|
[3e17aed] | 27 | #include "onset/peakpicker.h" |
---|
[7524d0b] | 28 | #include "mathutils.h" |
---|
[32d6958] | 29 | #include "onset/onset.h" |
---|
[7524d0b] | 30 | |
---|
[989bf7f] | 31 | /** structure to store object state */ |
---|
[7524d0b] | 32 | struct _aubio_onset_t { |
---|
[989bf7f] | 33 | aubio_pvoc_t * pv; /**< phase vocoder */ |
---|
[df53936] | 34 | aubio_specdesc_t * od; /**< spectral descriptor */ |
---|
[8766cb6] | 35 | aubio_peakpicker_t * pp; /**< peak picker */ |
---|
[989bf7f] | 36 | cvec_t * fftgrain; /**< phase vocoder output */ |
---|
[df53936] | 37 | fvec_t * desc; /**< spectral description */ |
---|
[989bf7f] | 38 | smpl_t silence; /**< silence threhsold */ |
---|
| 39 | uint_t minioi; /**< minimum inter onset interval */ |
---|
[f5e0a54] | 40 | uint_t delay; /**< constant delay, in samples, removed from detected onset times */ |
---|
[e4f142c] | 41 | uint_t samplerate; /**< sampling rate of the input signal */ |
---|
[f5e0a54] | 42 | uint_t hop_size; /**< number of samples between two runs */ |
---|
| 43 | |
---|
| 44 | uint_t total_frames; /**< total number of frames processed since the beginning */ |
---|
| 45 | uint_t last_onset; /**< last detected onset location, in frames */ |
---|
[9f060d1] | 46 | |
---|
| 47 | uint_t apply_adaptive_whitening; |
---|
| 48 | aubio_spectral_whitening_t *spectral_whitening; |
---|
[7524d0b] | 49 | }; |
---|
| 50 | |
---|
| 51 | /* execute onset detection function on iput buffer */ |
---|
[a72f3f1] | 52 | void aubio_onset_do (aubio_onset_t *o, fvec_t * input, fvec_t * onset) |
---|
[7524d0b] | 53 | { |
---|
[56ef7e1] | 54 | smpl_t isonset = 0; |
---|
[7524d0b] | 55 | aubio_pvoc_do (o->pv,input, o->fftgrain); |
---|
[9f060d1] | 56 | /* |
---|
| 57 | if (apply_filtering) { |
---|
| 58 | } |
---|
| 59 | if (apply_compression) { |
---|
| 60 | } |
---|
| 61 | */ |
---|
| 62 | if (o->apply_adaptive_whitening) { |
---|
| 63 | aubio_spectral_whitening_do(o->spectral_whitening, o->fftgrain); |
---|
| 64 | } |
---|
[df53936] | 65 | aubio_specdesc_do (o->od, o->fftgrain, o->desc); |
---|
| 66 | aubio_peakpicker_do(o->pp, o->desc, onset); |
---|
[0b9a02a] | 67 | isonset = onset->data[0]; |
---|
[0f6f2e6] | 68 | if (isonset > 0.) { |
---|
[7524d0b] | 69 | if (aubio_silence_detection(input, o->silence)==1) { |
---|
[df53936] | 70 | //AUBIO_DBG ("silent onset, not marking as onset\n"); |
---|
[7524d0b] | 71 | isonset = 0; |
---|
| 72 | } else { |
---|
[8b884ef] | 73 | uint_t new_onset = o->total_frames + (uint_t)ROUND(isonset * o->hop_size); |
---|
[35f73b8c] | 74 | if (o->last_onset + o->minioi < new_onset) { |
---|
[df53936] | 75 | //AUBIO_DBG ("accepted detection, marking as onset\n"); |
---|
[35f73b8c] | 76 | o->last_onset = new_onset; |
---|
[7524d0b] | 77 | } else { |
---|
[df53936] | 78 | //AUBIO_DBG ("doubled onset, not marking as onset\n"); |
---|
[7524d0b] | 79 | isonset = 0; |
---|
| 80 | } |
---|
| 81 | } |
---|
| 82 | } else { |
---|
[35f73b8c] | 83 | // we are at the beginning of the file, and we don't find silence |
---|
[28c066e] | 84 | if (o->total_frames <= o->delay && o->last_onset < o ->minioi && aubio_silence_detection(input, o->silence) == 0) { |
---|
[35f73b8c] | 85 | //AUBIO_DBG ("beginning of file is not silent, marking as onset\n"); |
---|
[f5e0a54] | 86 | isonset = o->delay / o->hop_size; |
---|
| 87 | o->last_onset = o->delay; |
---|
[376946a] | 88 | } |
---|
[7524d0b] | 89 | } |
---|
[0b9a02a] | 90 | onset->data[0] = isonset; |
---|
[f5e0a54] | 91 | o->total_frames += o->hop_size; |
---|
[7524d0b] | 92 | return; |
---|
| 93 | } |
---|
| 94 | |
---|
[8b884ef] | 95 | uint_t aubio_onset_get_last (aubio_onset_t *o) |
---|
[f5e0a54] | 96 | { |
---|
| 97 | return o->last_onset - o->delay; |
---|
| 98 | } |
---|
| 99 | |
---|
[8b884ef] | 100 | smpl_t aubio_onset_get_last_s (aubio_onset_t *o) |
---|
[f5e0a54] | 101 | { |
---|
[8b884ef] | 102 | return aubio_onset_get_last (o) / (smpl_t) (o->samplerate); |
---|
[f5e0a54] | 103 | } |
---|
| 104 | |
---|
[8b884ef] | 105 | smpl_t aubio_onset_get_last_ms (aubio_onset_t *o) |
---|
[f5e0a54] | 106 | { |
---|
[47e067b] | 107 | return aubio_onset_get_last_s (o) * 1000.; |
---|
[f5e0a54] | 108 | } |
---|
| 109 | |
---|
[6338636] | 110 | uint_t aubio_onset_set_silence(aubio_onset_t * o, smpl_t silence) { |
---|
[7524d0b] | 111 | o->silence = silence; |
---|
[6338636] | 112 | return AUBIO_OK; |
---|
[7524d0b] | 113 | } |
---|
| 114 | |
---|
[96a96d7] | 115 | smpl_t aubio_onset_get_silence(aubio_onset_t * o) { |
---|
| 116 | return o->silence; |
---|
| 117 | } |
---|
| 118 | |
---|
[6338636] | 119 | uint_t aubio_onset_set_threshold(aubio_onset_t * o, smpl_t threshold) { |
---|
[8f14c6e] | 120 | aubio_peakpicker_set_threshold(o->pp, threshold); |
---|
[6338636] | 121 | return AUBIO_OK; |
---|
[7524d0b] | 122 | } |
---|
| 123 | |
---|
[10b11d6] | 124 | smpl_t aubio_onset_get_threshold(aubio_onset_t * o) { |
---|
| 125 | return aubio_peakpicker_get_threshold(o->pp); |
---|
| 126 | } |
---|
| 127 | |
---|
[6338636] | 128 | uint_t aubio_onset_set_minioi(aubio_onset_t * o, uint_t minioi) { |
---|
[35f73b8c] | 129 | o->minioi = minioi; |
---|
[6338636] | 130 | return AUBIO_OK; |
---|
[7524d0b] | 131 | } |
---|
| 132 | |
---|
[f5e0a54] | 133 | uint_t aubio_onset_get_minioi(aubio_onset_t * o) { |
---|
| 134 | return o->minioi; |
---|
| 135 | } |
---|
| 136 | |
---|
[35f73b8c] | 137 | uint_t aubio_onset_set_minioi_s(aubio_onset_t * o, smpl_t minioi) { |
---|
| 138 | return aubio_onset_set_minioi (o, minioi * o->samplerate); |
---|
| 139 | } |
---|
| 140 | |
---|
| 141 | smpl_t aubio_onset_get_minioi_s(aubio_onset_t * o) { |
---|
| 142 | return aubio_onset_get_minioi (o) / (smpl_t) o->samplerate; |
---|
| 143 | } |
---|
| 144 | |
---|
| 145 | uint_t aubio_onset_set_minioi_ms(aubio_onset_t * o, smpl_t minioi) { |
---|
| 146 | return aubio_onset_set_minioi_s (o, minioi / 1000.); |
---|
| 147 | } |
---|
| 148 | |
---|
| 149 | smpl_t aubio_onset_get_minioi_ms(aubio_onset_t * o) { |
---|
| 150 | return aubio_onset_get_minioi_s (o) * 1000.; |
---|
| 151 | } |
---|
| 152 | |
---|
[f5e0a54] | 153 | uint_t aubio_onset_set_delay(aubio_onset_t * o, uint_t delay) { |
---|
| 154 | o->delay = delay; |
---|
| 155 | return AUBIO_OK; |
---|
| 156 | } |
---|
| 157 | |
---|
| 158 | uint_t aubio_onset_get_delay(aubio_onset_t * o) { |
---|
| 159 | return o->delay; |
---|
| 160 | } |
---|
| 161 | |
---|
| 162 | uint_t aubio_onset_set_delay_s(aubio_onset_t * o, smpl_t delay) { |
---|
| 163 | return aubio_onset_set_delay (o, delay * o->samplerate); |
---|
| 164 | } |
---|
| 165 | |
---|
| 166 | smpl_t aubio_onset_get_delay_s(aubio_onset_t * o) { |
---|
| 167 | return aubio_onset_get_delay (o) / (smpl_t) o->samplerate; |
---|
| 168 | } |
---|
| 169 | |
---|
| 170 | uint_t aubio_onset_set_delay_ms(aubio_onset_t * o, smpl_t delay) { |
---|
| 171 | return aubio_onset_set_delay_s (o, delay / 1000.); |
---|
| 172 | } |
---|
| 173 | |
---|
| 174 | smpl_t aubio_onset_get_delay_ms(aubio_onset_t * o) { |
---|
| 175 | return aubio_onset_get_delay_s (o) * 1000.; |
---|
| 176 | } |
---|
| 177 | |
---|
[35f73b8c] | 178 | smpl_t aubio_onset_get_descriptor(aubio_onset_t * o) { |
---|
[df53936] | 179 | return o->desc->data[0]; |
---|
[35f73b8c] | 180 | } |
---|
| 181 | |
---|
| 182 | smpl_t aubio_onset_get_thresholded_descriptor(aubio_onset_t * o) { |
---|
| 183 | fvec_t * thresholded = aubio_peakpicker_get_thresholded_input(o->pp); |
---|
| 184 | return thresholded->data[0]; |
---|
| 185 | } |
---|
| 186 | |
---|
[7524d0b] | 187 | /* Allocate memory for an onset detection */ |
---|
[b4f5967] | 188 | aubio_onset_t * new_aubio_onset (char_t * onset_mode, |
---|
[0b9a02a] | 189 | uint_t buf_size, uint_t hop_size, uint_t samplerate) |
---|
[7524d0b] | 190 | { |
---|
| 191 | aubio_onset_t * o = AUBIO_NEW(aubio_onset_t); |
---|
[892c369] | 192 | |
---|
| 193 | /* check parameters are valid */ |
---|
| 194 | if ((sint_t)hop_size < 1) { |
---|
| 195 | AUBIO_ERR("onset: got hop_size %d, but can not be < 1\n", hop_size); |
---|
| 196 | goto beach; |
---|
| 197 | } else if ((sint_t)buf_size < 1) { |
---|
| 198 | AUBIO_ERR("onset: got buffer_size %d, but can not be < 1\n", buf_size); |
---|
| 199 | goto beach; |
---|
| 200 | } else if (buf_size < hop_size) { |
---|
| 201 | AUBIO_ERR("onset: hop size (%d) is larger than win size (%d)\n", buf_size, hop_size); |
---|
| 202 | goto beach; |
---|
| 203 | } else if ((sint_t)samplerate < 1) { |
---|
| 204 | AUBIO_ERR("onset: samplerate (%d) can not be < 1\n", samplerate); |
---|
| 205 | goto beach; |
---|
| 206 | } |
---|
| 207 | |
---|
[8f14c6e] | 208 | /* store creation parameters */ |
---|
[35f73b8c] | 209 | o->samplerate = samplerate; |
---|
| 210 | o->hop_size = hop_size; |
---|
[8f14c6e] | 211 | |
---|
| 212 | /* allocate memory */ |
---|
[35f73b8c] | 213 | o->pv = new_aubio_pvoc(buf_size, o->hop_size); |
---|
[0b9a02a] | 214 | o->pp = new_aubio_peakpicker(); |
---|
| 215 | o->od = new_aubio_specdesc(onset_mode,buf_size); |
---|
| 216 | o->fftgrain = new_cvec(buf_size); |
---|
[df53936] | 217 | o->desc = new_fvec(1); |
---|
[8f14c6e] | 218 | |
---|
| 219 | /* set some default parameter */ |
---|
| 220 | aubio_onset_set_threshold (o, 0.3); |
---|
[cbda661] | 221 | aubio_onset_set_delay(o, 4.3 * hop_size); |
---|
[8f14c6e] | 222 | aubio_onset_set_minioi_ms(o, 20.); |
---|
| 223 | aubio_onset_set_silence(o, -70.); |
---|
| 224 | |
---|
[9f060d1] | 225 | o->spectral_whitening = new_aubio_spectral_whitening(buf_size, hop_size, samplerate); |
---|
| 226 | o->apply_adaptive_whitening = 1; |
---|
| 227 | |
---|
[8f14c6e] | 228 | /* initialize internal variables */ |
---|
| 229 | o->last_onset = 0; |
---|
| 230 | o->total_frames = 0; |
---|
[7524d0b] | 231 | return o; |
---|
[892c369] | 232 | |
---|
| 233 | beach: |
---|
| 234 | AUBIO_FREE(o); |
---|
| 235 | return NULL; |
---|
[7524d0b] | 236 | } |
---|
| 237 | |
---|
| 238 | void del_aubio_onset (aubio_onset_t *o) |
---|
| 239 | { |
---|
[9f060d1] | 240 | del_aubio_spectral_whitening(o->spectral_whitening); |
---|
[31907fd] | 241 | del_aubio_specdesc(o->od); |
---|
[7524d0b] | 242 | del_aubio_peakpicker(o->pp); |
---|
| 243 | del_aubio_pvoc(o->pv); |
---|
[df53936] | 244 | del_fvec(o->desc); |
---|
[7524d0b] | 245 | del_cvec(o->fftgrain); |
---|
| 246 | AUBIO_FREE(o); |
---|
| 247 | } |
---|