1 | /* |
---|
2 | Copyright (C) 2003-2015 Paul Brossier <piem@aubio.org> |
---|
3 | |
---|
4 | This file is part of aubio. |
---|
5 | |
---|
6 | aubio is free software: you can redistribute it and/or modify |
---|
7 | it under the terms of the GNU General Public License as published by |
---|
8 | the Free Software Foundation, either version 3 of the License, or |
---|
9 | (at your option) any later version. |
---|
10 | |
---|
11 | aubio is distributed in the hope that it will be useful, |
---|
12 | but WITHOUT ANY WARRANTY; without even the implied warranty of |
---|
13 | MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
---|
14 | GNU General Public License for more details. |
---|
15 | |
---|
16 | You should have received a copy of the GNU General Public License |
---|
17 | along with aubio. If not, see <http://www.gnu.org/licenses/>. |
---|
18 | |
---|
19 | */ |
---|
20 | |
---|
21 | /** @file |
---|
22 | * various functions useful in audio signal processing |
---|
23 | */ |
---|
24 | |
---|
25 | #ifndef AUBIO_MUSICUTILS_H |
---|
26 | #define AUBIO_MUSICUTILS_H |
---|
27 | |
---|
28 | #ifdef __cplusplus |
---|
29 | extern "C" { |
---|
30 | #endif |
---|
31 | |
---|
32 | /** create window |
---|
33 | |
---|
34 | \param window_type type of the window to create |
---|
35 | \param size length of the window to create (see fvec_set_window()) |
---|
36 | |
---|
37 | */ |
---|
38 | fvec_t *new_aubio_window (char_t * window_type, uint_t size); |
---|
39 | |
---|
40 | /** set elements of a vector to window coefficients |
---|
41 | |
---|
42 | \param window exsting ::fvec_t to use |
---|
43 | \param window_type type of the window to create |
---|
44 | |
---|
45 | List of available window types: "rectangle", "hamming", "hanning", |
---|
46 | "hanningz", "blackman", "blackman_harris", "gaussian", "welch", "parzen", |
---|
47 | "default". |
---|
48 | |
---|
49 | "default" is equivalent to "hanningz". |
---|
50 | |
---|
51 | References: |
---|
52 | |
---|
53 | - <a href="http://en.wikipedia.org/wiki/Window_function">Window |
---|
54 | function</a> on Wikipedia |
---|
55 | - Amalia de Götzen, Nicolas Bernardini, and Daniel Arfib. Traditional (?) |
---|
56 | implementations of a phase vocoder: the tricks of the trade. In Proceedings of |
---|
57 | the International Conference on Digital Audio Effects (DAFx-00), pages 37–44, |
---|
58 | Uni- versity of Verona, Italy, 2000. |
---|
59 | (<a href="http://www.cs.princeton.edu/courses/archive/spr09/cos325/Bernardini.pdf"> |
---|
60 | pdf</a>) |
---|
61 | |
---|
62 | */ |
---|
63 | uint_t fvec_set_window (fvec_t * window, char_t * window_type); |
---|
64 | |
---|
65 | /** compute the principal argument |
---|
66 | |
---|
67 | This function maps the input phase to its corresponding value wrapped in the |
---|
68 | range \f$ [-\pi, \pi] \f$. |
---|
69 | |
---|
70 | \param phase unwrapped phase to map to the unit circle |
---|
71 | |
---|
72 | \return equivalent phase wrapped to the unit circle |
---|
73 | |
---|
74 | */ |
---|
75 | smpl_t aubio_unwrap2pi (smpl_t phase); |
---|
76 | |
---|
77 | /** convert frequency bin to midi value */ |
---|
78 | smpl_t aubio_bintomidi (smpl_t bin, smpl_t samplerate, smpl_t fftsize); |
---|
79 | |
---|
80 | /** convert midi value to frequency bin */ |
---|
81 | smpl_t aubio_miditobin (smpl_t midi, smpl_t samplerate, smpl_t fftsize); |
---|
82 | |
---|
83 | /** convert frequency bin to frequency (Hz) */ |
---|
84 | smpl_t aubio_bintofreq (smpl_t bin, smpl_t samplerate, smpl_t fftsize); |
---|
85 | |
---|
86 | /** convert frequency (Hz) to frequency bin */ |
---|
87 | smpl_t aubio_freqtobin (smpl_t freq, smpl_t samplerate, smpl_t fftsize); |
---|
88 | |
---|
89 | /** convert frequency (Hz) to mel |
---|
90 | |
---|
91 | \param freq input frequency, in Hz |
---|
92 | |
---|
93 | \return output mel |
---|
94 | |
---|
95 | Converts a scalar from the frequency domain to the mel scale using Slaney |
---|
96 | Auditory Toolbox's implementation: |
---|
97 | |
---|
98 | If \f$ f < 1000 \f$, \f$ m = 3 f / 200 \f$. |
---|
99 | |
---|
100 | If \f$ f >= 1000 \f$, \f$ m = 1000 + 27 \frac{{ln}(f) - ln(1000))} |
---|
101 | {{ln}(6400) - ln(1000)} |
---|
102 | \f$ |
---|
103 | |
---|
104 | See also |
---|
105 | -------- |
---|
106 | |
---|
107 | aubio_meltohz(), aubio_hztomel_htk(). |
---|
108 | |
---|
109 | */ |
---|
110 | smpl_t aubio_hztomel (smpl_t freq); |
---|
111 | |
---|
112 | /** convert mel to frequency (Hz) |
---|
113 | |
---|
114 | \param mel input mel |
---|
115 | |
---|
116 | \return output frequency, in Hz |
---|
117 | |
---|
118 | Converts a scalar from the mel scale to the frequency domain using Slaney |
---|
119 | Auditory Toolbox's implementation: |
---|
120 | |
---|
121 | If \f$ f < 1000 \f$, \f$ f = 200 m/3 \f$. |
---|
122 | |
---|
123 | If \f$ f \geq 1000 \f$, \f$ f = 1000 + \left(\frac{6400}{1000}\right) |
---|
124 | ^{\frac{m - 1000}{27}} \f$ |
---|
125 | |
---|
126 | See also |
---|
127 | -------- |
---|
128 | |
---|
129 | aubio_hztomel(), aubio_meltohz_htk(). |
---|
130 | |
---|
131 | References |
---|
132 | ---------- |
---|
133 | |
---|
134 | Malcolm Slaney, *Auditory Toolbox Version 2, Technical Report #1998-010* |
---|
135 | https://engineering.purdue.edu/~malcolm/interval/1998-010/ |
---|
136 | |
---|
137 | */ |
---|
138 | smpl_t aubio_meltohz (smpl_t mel); |
---|
139 | |
---|
140 | /** convert frequency (Hz) to mel |
---|
141 | |
---|
142 | \param freq input frequency, in Hz |
---|
143 | |
---|
144 | \return output mel |
---|
145 | |
---|
146 | Converts a scalar from the frequency domain to the mel scale, using the |
---|
147 | equation defined by O'Shaughnessy, as implemented in the HTK speech |
---|
148 | recognition toolkit: |
---|
149 | |
---|
150 | \f$ m = 1127 + ln(1 + \frac{f}{700}) \f$ |
---|
151 | |
---|
152 | See also |
---|
153 | -------- |
---|
154 | |
---|
155 | aubio_meltohz_htk(), aubio_hztomel(). |
---|
156 | |
---|
157 | References |
---|
158 | ---------- |
---|
159 | |
---|
160 | Douglas O'Shaughnessy (1987). *Speech communication: human and machine*. |
---|
161 | Addison-Wesley. p. 150. ISBN 978-0-201-16520-3. |
---|
162 | |
---|
163 | HTK Speech Recognition Toolkit: http://htk.eng.cam.ac.uk/ |
---|
164 | |
---|
165 | */ |
---|
166 | smpl_t aubio_hztomel_htk (smpl_t freq); |
---|
167 | |
---|
168 | /** convert mel to frequency (Hz) |
---|
169 | |
---|
170 | \param mel input mel |
---|
171 | |
---|
172 | \return output frequency, in Hz |
---|
173 | |
---|
174 | Converts a scalar from the mel scale to the frequency domain, using the |
---|
175 | equation defined by O'Shaughnessy, as implemented in the HTK speech |
---|
176 | recognition toolkit: |
---|
177 | |
---|
178 | \f$ f = 700 * {e}^\left(\frac{f}{1127} - 1\right) \f$ |
---|
179 | |
---|
180 | See also |
---|
181 | -------- |
---|
182 | |
---|
183 | aubio_hztomel_htk(), aubio_meltohz(). |
---|
184 | |
---|
185 | */ |
---|
186 | smpl_t aubio_meltohz_htk (smpl_t mel); |
---|
187 | |
---|
188 | /** convert frequency (Hz) to midi value (0-128) */ |
---|
189 | smpl_t aubio_freqtomidi (smpl_t freq); |
---|
190 | |
---|
191 | /** convert midi value (0-128) to frequency (Hz) */ |
---|
192 | smpl_t aubio_miditofreq (smpl_t midi); |
---|
193 | |
---|
194 | /** clean up cached memory at the end of program |
---|
195 | |
---|
196 | This function should be used at the end of programs to purge all cached |
---|
197 | memory. So far it is only useful to clean FFTW's cache. |
---|
198 | |
---|
199 | */ |
---|
200 | void aubio_cleanup (void); |
---|
201 | |
---|
202 | /** zero-crossing rate (ZCR) |
---|
203 | |
---|
204 | The zero-crossing rate is the number of times a signal changes sign, |
---|
205 | divided by the length of this signal. |
---|
206 | |
---|
207 | \param v vector to compute ZCR from |
---|
208 | |
---|
209 | \return zero-crossing rate of v |
---|
210 | |
---|
211 | */ |
---|
212 | smpl_t aubio_zero_crossing_rate (fvec_t * v); |
---|
213 | |
---|
214 | /** compute sound level on a linear scale |
---|
215 | |
---|
216 | This gives the average of the square amplitudes. |
---|
217 | |
---|
218 | \param v vector to compute level from |
---|
219 | |
---|
220 | \return level of v |
---|
221 | |
---|
222 | */ |
---|
223 | smpl_t aubio_level_lin (const fvec_t * v); |
---|
224 | |
---|
225 | /** compute sound pressure level (SPL) in dB |
---|
226 | |
---|
227 | This quantity is often wrongly called 'loudness'. |
---|
228 | |
---|
229 | This gives ten times the log10 of the average of the square amplitudes. |
---|
230 | |
---|
231 | \param v vector to compute dB SPL from |
---|
232 | |
---|
233 | \return level of v in dB SPL |
---|
234 | |
---|
235 | */ |
---|
236 | smpl_t aubio_db_spl (const fvec_t * v); |
---|
237 | |
---|
238 | /** check if buffer level in dB SPL is under a given threshold |
---|
239 | |
---|
240 | \param v vector to get level from |
---|
241 | \param threshold threshold in dB SPL |
---|
242 | |
---|
243 | \return 1 if level is under the given threshold, 0 otherwise |
---|
244 | |
---|
245 | */ |
---|
246 | uint_t aubio_silence_detection (const fvec_t * v, smpl_t threshold); |
---|
247 | |
---|
248 | /** get buffer level if level >= threshold, 1. otherwise |
---|
249 | |
---|
250 | \param v vector to get level from |
---|
251 | \param threshold threshold in dB SPL |
---|
252 | |
---|
253 | \return level in dB SPL if level >= threshold, 1. otherwise |
---|
254 | |
---|
255 | */ |
---|
256 | smpl_t aubio_level_detection (const fvec_t * v, smpl_t threshold); |
---|
257 | |
---|
258 | /** clamp the values of a vector within the range [-abs(max), abs(max)] |
---|
259 | |
---|
260 | \param in vector to clamp |
---|
261 | \param absmax maximum value over which input vector elements should be clamped |
---|
262 | |
---|
263 | */ |
---|
264 | void fvec_clamp(fvec_t *in, smpl_t absmax); |
---|
265 | |
---|
266 | #ifdef __cplusplus |
---|
267 | } |
---|
268 | #endif |
---|
269 | |
---|
270 | #endif /* AUBIO_MUSICUTILS_H */ |
---|