annotate src/init.c @ 161:246c203cc733

Add wavelet-based pitch tracker
author Jamie Bullock <jamie@jamiebullock.com>
date Fri, 31 May 2013 22:44:03 +0100
parents 71870680f7c1
children 39d168ee5917
rev   line source
jamie@141 1 /*
jamie@141 2 * Copyright (C) 2012 Jamie Bullock
jamie@140 3 *
jamie@141 4 * Permission is hereby granted, free of charge, to any person obtaining a copy
jamie@141 5 * of this software and associated documentation files (the "Software"), to
jamie@141 6 * deal in the Software without restriction, including without limitation the
jamie@141 7 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
jamie@141 8 * sell copies of the Software, and to permit persons to whom the Software is
jamie@141 9 * furnished to do so, subject to the following conditions:
jamie@1 10 *
jamie@141 11 * The above copyright notice and this permission notice shall be included in
jamie@141 12 * all copies or substantial portions of the Software.
jamie@1 13 *
jamie@141 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
jamie@141 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
jamie@141 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
jamie@141 17 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
jamie@141 18 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
jamie@141 19 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
jamie@141 20 * IN THE SOFTWARE.
jamie@1 21 *
jamie@1 22 */
jamie@1 23
jamie@107 24 /* init.c: defines initialisation and free functions. Also contains library constructor routine. */
jamie@1 25
jamie@98 26 #ifdef HAVE_CONFIG_H
jamie@150 27 #include <config.h>
jamie@98 28 #endif
jamie@98 29
jamie@1 30 #include <math.h>
jamie@26 31 #include <stdlib.h>
jamie@140 32 #include <stdio.h>
jamie@140 33
jamie@150 34 #include "fft.h"
jamie@1 35
jamie@159 36 #include "../xtract/libxtract.h"
jamie@107 37 #include "xtract_window_private.h"
jamie@161 38 #include "xtract_scalar_private.h"
jamie@102 39 #define DEFINE_GLOBALS
jamie@98 40 #include "xtract_globals_private.h"
jamie@98 41
jamie@98 42
jamie@150 43
jamie@150 44 #ifdef USE_OOURA
jamie@150 45 void xtract_init_ooura_data(xtract_ooura_data *ooura_data, unsigned int N)
jamie@150 46 {
jamie@150 47 ooura_data->ooura_ip = (int *)calloc((2 + sqrt(N)), sizeof(int));
jamie@150 48 ooura_data->ooura_w = (double *)calloc((N - 1), sizeof(double));
jamie@150 49 ooura_data->initialised = true;
jamie@150 50 }
jamie@150 51
jamie@150 52 void xtract_free_ooura_data(xtract_ooura_data *ooura_data)
jamie@150 53 {
jamie@150 54 free(ooura_data->ooura_ip);
jamie@150 55 free(ooura_data->ooura_w);
jamie@150 56 ooura_data->ooura_ip = NULL;
jamie@150 57 ooura_data->ooura_w = NULL;
jamie@150 58 ooura_data->initialised = false;
jamie@150 59 }
jamie@150 60
jamie@150 61 int xtract_init_ooura_(int N, int feature_name)
jamie@150 62 {
jamie@150 63
jamie@150 64 int M = N >> 1;
jamie@150 65
jamie@150 66 if(feature_name == XTRACT_AUTOCORRELATION_FFT)
jamie@150 67 {
jamie@150 68 M = N; /* allow for zero padding */
jamie@150 69 }
jamie@150 70
jamie@150 71 switch(feature_name)
jamie@150 72 {
jamie@150 73 case XTRACT_SPECTRUM:
jamie@150 74 if(ooura_data_spectrum.initialised)
jamie@150 75 {
jamie@150 76 xtract_free_ooura_data(&ooura_data_spectrum);
jamie@150 77 }
jamie@150 78 xtract_init_ooura_data(&ooura_data_spectrum, M);
jamie@150 79 break;
jamie@150 80 case XTRACT_AUTOCORRELATION_FFT:
jamie@150 81 if(ooura_data_autocorrelation_fft.initialised)
jamie@150 82 {
jamie@150 83 xtract_free_ooura_data(&ooura_data_autocorrelation_fft);
jamie@150 84 }
jamie@150 85 xtract_init_ooura_data(&ooura_data_autocorrelation_fft, M);
jamie@150 86 break;
jamie@150 87 case XTRACT_DCT:
jamie@150 88 if(ooura_data_dct.initialised)
jamie@150 89 {
jamie@150 90 xtract_free_ooura_data(&ooura_data_dct);
jamie@150 91 }
jamie@150 92 xtract_init_ooura_data(&ooura_data_dct, M);
jamie@150 93 case XTRACT_MFCC:
jamie@150 94 if(ooura_data_mfcc.initialised)
jamie@150 95 {
jamie@150 96 xtract_free_ooura_data(&ooura_data_mfcc);
jamie@150 97 }
jamie@150 98 xtract_init_ooura_data(&ooura_data_mfcc, M);
jamie@150 99 break;
jamie@150 100 }
jamie@150 101
jamie@150 102 return XTRACT_SUCCESS;
jamie@150 103 }
jamie@150 104
jamie@150 105 void xtract_free_ooura_(void)
jamie@150 106 {
jamie@150 107 if(ooura_data_spectrum.initialised)
jamie@150 108 {
jamie@150 109 xtract_free_ooura_data(&ooura_data_spectrum);
jamie@150 110 }
jamie@150 111 if(ooura_data_autocorrelation_fft.initialised)
jamie@150 112 {
jamie@150 113 xtract_free_ooura_data(&ooura_data_autocorrelation_fft);
jamie@150 114 }
jamie@150 115 if(ooura_data_dct.initialised)
jamie@150 116 {
jamie@150 117 xtract_free_ooura_data(&ooura_data_dct);
jamie@150 118 }
jamie@150 119 if(ooura_data_mfcc.initialised)
jamie@150 120 {
jamie@150 121 xtract_free_ooura_data(&ooura_data_mfcc);
jamie@150 122 }
jamie@150 123 }
jamie@150 124
jamie@150 125 #else
jamie@150 126
jamie@150 127 void xtract_init_vdsp_data(xtract_vdsp_data *vdsp_data, unsigned int N)
jamie@150 128 {
jamie@150 129 vdsp_data->setup = vDSP_create_fftsetupD(log2f(N), FFT_RADIX2);
jamie@150 130 vdsp_data->fft.realp = (double *) malloc((N >> 1) * sizeof(double));
jamie@150 131 vdsp_data->fft.imagp = (double *) malloc((N >> 1) * sizeof(double));
jamie@150 132 vdsp_data->log2N = log2f(N);
jamie@150 133 vdsp_data->initialised = true;
jamie@150 134 }
jamie@150 135
jamie@150 136 void xtract_free_vdsp_data(xtract_vdsp_data *vdsp_data)
jamie@150 137 {
jamie@150 138 free(vdsp_data->fft.realp);
jamie@150 139 free(vdsp_data->fft.imagp);
jamie@150 140 vDSP_destroy_fftsetupD(vdsp_data->setup);
jamie@150 141 vdsp_data->fft.realp = NULL;
jamie@150 142 vdsp_data->fft.imagp = NULL;
jamie@150 143 vdsp_data->initialised = false;
jamie@150 144 }
jamie@150 145
jamie@150 146 int xtract_init_vdsp_(int N, int feature_name)
jamie@150 147 {
jamie@150 148
jamie@150 149 int M = N >> 1;
jamie@150 150
jamie@150 151 if(feature_name == XTRACT_AUTOCORRELATION_FFT)
jamie@150 152 {
jamie@150 153 M = N; /* allow for zero padding */
jamie@150 154 }
jamie@150 155
jamie@150 156 switch(feature_name)
jamie@150 157 {
jamie@150 158 case XTRACT_SPECTRUM:
jamie@150 159 if(vdsp_data_spectrum.initialised)
jamie@150 160 {
jamie@150 161 xtract_free_vdsp_data(&vdsp_data_spectrum);
jamie@150 162 }
jamie@150 163 xtract_init_vdsp_data(&vdsp_data_spectrum, M);
jamie@150 164 break;
jamie@150 165 case XTRACT_AUTOCORRELATION_FFT:
jamie@150 166 if(vdsp_data_autocorrelation_fft.initialised)
jamie@150 167 {
jamie@150 168 xtract_free_vdsp_data(&vdsp_data_autocorrelation_fft);
jamie@150 169 }
jamie@150 170 xtract_init_vdsp_data(&vdsp_data_autocorrelation_fft, M);
jamie@150 171 break;
jamie@150 172 case XTRACT_DCT:
jamie@150 173 if(vdsp_data_dct.initialised)
jamie@150 174 {
jamie@150 175 xtract_free_vdsp_data(&vdsp_data_dct);
jamie@150 176 }
jamie@150 177 xtract_init_vdsp_data(&vdsp_data_dct, M);
jamie@150 178 case XTRACT_MFCC:
jamie@150 179 if(vdsp_data_mfcc.initialised)
jamie@150 180 {
jamie@150 181 xtract_free_vdsp_data(&vdsp_data_mfcc);
jamie@150 182 }
jamie@150 183 xtract_init_vdsp_data(&vdsp_data_mfcc, M);
jamie@150 184 break;
jamie@150 185 }
jamie@150 186
jamie@150 187 return XTRACT_SUCCESS;
jamie@150 188 }
jamie@150 189
jamie@150 190 void xtract_free_vdsp_(void)
jamie@150 191 {
jamie@150 192 if(vdsp_data_spectrum.initialised)
jamie@150 193 {
jamie@150 194 xtract_free_vdsp_data(&vdsp_data_spectrum);
jamie@150 195 }
jamie@150 196 if(vdsp_data_autocorrelation_fft.initialised)
jamie@150 197 {
jamie@150 198 xtract_free_vdsp_data(&vdsp_data_autocorrelation_fft);
jamie@150 199 }
jamie@150 200 if(vdsp_data_dct.initialised)
jamie@150 201 {
jamie@150 202 xtract_free_vdsp_data(&vdsp_data_dct);
jamie@150 203 }
jamie@150 204 if(vdsp_data_mfcc.initialised)
jamie@150 205 {
jamie@150 206 xtract_free_vdsp_data(&vdsp_data_mfcc);
jamie@150 207 }
jamie@150 208 }
jamie@150 209
jamie@150 210
jamie@150 211 #endif
jamie@150 212
/**
 * Initialise the FFT backend data for one feature.
 *
 * Dispatches to the Ooura implementation when USE_OOURA is defined and to
 * the vDSP implementation otherwise. If N is not accepted by
 * xtract_is_poweroftwo(), an error is written to stderr and the process is
 * terminated with EXIT_FAILURE.
 *
 * @param N            FFT frame size
 * @param feature_name feature the FFT data is initialised for
 * @return the result of the backend initialisation routine
 */
int xtract_init_fft(int N, int feature_name)
{
    if(xtract_is_poweroftwo(N))
    {
#ifdef USE_OOURA
        return xtract_init_ooura_(N, feature_name);
#else
        return xtract_init_vdsp_(N, feature_name);
#endif
    }

    /* Unsupported size: report it and terminate. */
    fputs("libxtract: error: only power-of-two FFT sizes are supported by Ooura FFT.\n",
          stderr);
    exit(EXIT_FAILURE);
}
jamie@150 227
/**
 * Release all FFT backend data: the vDSP data when USE_OOURA is not
 * defined, the Ooura work areas when it is.
 */
void xtract_free_fft(void)
{
#ifndef USE_OOURA
    xtract_free_vdsp_();
#else
    xtract_free_ooura_();
#endif
}
jamie@150 236
jamie@150 237
jamie@150 238 int xtract_init_bark(int N, double sr, int *band_limits)
jamie@150 239 {
jamie@150 240
jamie@150 241 double edges[] = {0, 100, 200, 300, 400, 510, 630, 770, 920, 1080, 1270, 1480, 1720, 2000, 2320, 2700, 3150, 3700, 4400, 5300, 6400, 7700, 9500, 12000, 15500, 20500, 27000}; /* Takes us up to sr = 54kHz (CCRMA: JOS)*/
jamie@150 242
jamie@150 243 int bands = XTRACT_BARK_BANDS;
jamie@150 244
jamie@150 245 while(bands--)
jamie@150 246 band_limits[bands] = edges[bands] / sr * N;
jamie@150 247 /*FIX shohuld use rounding, but couldn't get it to work */
jamie@150 248
jamie@150 249 return XTRACT_SUCCESS;
jamie@150 250 }
jamie@150 251
jamie@146 252 int xtract_init_mfcc(int N, double nyquist, int style, double freq_min, double freq_max, int freq_bands, double **fft_tables)
jamie@140 253 {
jamie@98 254
jamie@140 255 int n, i, k, *fft_peak, M, next_peak;
jamie@146 256 double norm, mel_freq_max, mel_freq_min, norm_fact, height, inc, val,
jamie@107 257 freq_bw_mel, *mel_peak, *height_norm, *lin_peak;
jamie@1 258
jamie@1 259 mel_peak = height_norm = lin_peak = NULL;
jamie@1 260 fft_peak = NULL;
jamie@140 261 norm = 1;
jamie@1 262
jamie@1 263 mel_freq_max = 1127 * log(1 + freq_max / 700);
jamie@1 264 mel_freq_min = 1127 * log(1 + freq_min / 700);
jamie@1 265 freq_bw_mel = (mel_freq_max - mel_freq_min) / freq_bands;
jamie@1 266
jamie@146 267 mel_peak = (double *)malloc((freq_bands + 2) * sizeof(double));
jamie@1 268 /* +2 for zeros at start and end */
jamie@146 269 lin_peak = (double *)malloc((freq_bands + 2) * sizeof(double));
jamie@1 270 fft_peak = (int *)malloc((freq_bands + 2) * sizeof(int));
jamie@146 271 height_norm = (double *)malloc(freq_bands * sizeof(double));
jamie@1 272
jamie@140 273 if(mel_peak == NULL || height_norm == NULL ||
jamie@107 274 lin_peak == NULL || fft_peak == NULL)
jamie@107 275 return XTRACT_MALLOC_FAILED;
jamie@107 276
jamie@1 277 M = N >> 1;
jamie@1 278
jamie@1 279 mel_peak[0] = mel_freq_min;
danstowell@95 280 lin_peak[0] = freq_min; // === 700 * (exp(mel_peak[0] / 1127) - 1);
jamie@1 281 fft_peak[0] = lin_peak[0] / nyquist * M;
jamie@1 282
jamie@1 283
jamie@140 284 for (n = 1; n < freq_bands + 2; n++)
jamie@140 285 {
jamie@140 286 //roll out peak locations - mel, linear and linear on fft window scale
jamie@1 287 mel_peak[n] = mel_peak[n - 1] + freq_bw_mel;
jamie@1 288 lin_peak[n] = 700 * (exp(mel_peak[n] / 1127) -1);
jamie@1 289 fft_peak[n] = lin_peak[n] / nyquist * M;
jamie@1 290 }
jamie@1 291
jamie@140 292 for (n = 0; n < freq_bands; n++)
jamie@140 293 {
danstowell@100 294 //roll out normalised gain of each peak
jamie@140 295 if (style == XTRACT_EQUAL_GAIN)
jamie@140 296 {
jamie@140 297 height = 1;
jamie@1 298 norm_fact = norm;
jamie@1 299 }
jamie@140 300 else
jamie@140 301 {
jamie@1 302 height = 2 / (lin_peak[n + 2] - lin_peak[n]);
jamie@1 303 norm_fact = norm / (2 / (lin_peak[2] - lin_peak[0]));
jamie@1 304 }
jamie@1 305 height_norm[n] = height * norm_fact;
jamie@1 306 }
jamie@1 307
jamie@1 308 i = 0;
jamie@107 309
jamie@140 310 for(n = 0; n < freq_bands; n++)
jamie@140 311 {
jamie@107 312
jamie@107 313 // calculate the rise increment
danstowell@95 314 if(n==0)
danstowell@95 315 inc = height_norm[n] / fft_peak[n];
danstowell@95 316 else
jamie@1 317 inc = height_norm[n] / (fft_peak[n] - fft_peak[n - 1]);
jamie@140 318 val = 0;
jamie@107 319
jamie@107 320 // zero the start of the array
jamie@107 321 for(k = 0; k < i; k++)
jamie@146 322 fft_tables[n][k] = 0.0;
jamie@107 323
jamie@107 324 // fill in the rise
jamie@140 325 for(; i <= fft_peak[n]; i++)
jamie@140 326 {
jamie@1 327 fft_tables[n][i] = val;
jamie@1 328 val += inc;
jamie@1 329 }
jamie@107 330
danstowell@95 331 // calculate the fall increment
jamie@1 332 inc = height_norm[n] / (fft_peak[n + 1] - fft_peak[n]);
jamie@107 333
jamie@1 334 val = 0;
jamie@107 335 next_peak = fft_peak[n + 1];
jamie@107 336
jamie@140 337 // reverse fill the 'fall'
jamie@140 338 for(i = next_peak; i > fft_peak[n]; i--)
jamie@140 339 {
jamie@1 340 fft_tables[n][i] = val;
jamie@1 341 val += inc;
jamie@1 342 }
jamie@39 343
jamie@107 344 // zero the rest of the array
jamie@107 345 for(k = next_peak + 1; k < N; k++)
jamie@146 346 fft_tables[n][k] = 0.0;
jamie@1 347 }
jamie@1 348
jamie@98 349
jamie@98 350 /* Initialise the fft_plan for the DCT */
jamie@140 351 /*
jamie@140 352 * Ooura doesn't support non power-of-two DCT
jamie@98 353 xtract_init_fft(freq_bands, XTRACT_MFCC);
jamie@140 354 */
jamie@98 355
jamie@1 356 free(mel_peak);
jamie@1 357 free(lin_peak);
jamie@1 358 free(height_norm);
jamie@1 359 free(fft_peak);
jamie@1 360
jamie@56 361 return XTRACT_SUCCESS;
jamie@1 362
jamie@1 363 }
jamie@1 364
jamie@161 365 int xtract_init_wavelet_f0_state(void)
jamie@161 366 {
jamie@161 367 dywapitch_inittracking(&wavelet_f0_state);
jamie@161 368 }
jamie@161 369
jamie@146 370 double *xtract_init_window(const int N, const int type)
jamie@140 371 {
jamie@146 372 double *window;
jamie@107 373
jamie@146 374 window = malloc(N * sizeof(double));
jamie@107 375
jamie@140 376 switch (type)
jamie@140 377 {
jamie@140 378 case XTRACT_GAUSS:
jamie@140 379 gauss(window, N, 0.4);
jamie@140 380 break;
jamie@140 381 case XTRACT_HAMMING:
jamie@140 382 hamming(window, N);
jamie@140 383 break;
jamie@140 384 case XTRACT_HANN:
jamie@140 385 hann(window, N);
jamie@140 386 break;
jamie@140 387 case XTRACT_BARTLETT:
jamie@140 388 bartlett(window, N);
jamie@140 389 break;
jamie@140 390 case XTRACT_TRIANGULAR:
jamie@140 391 triangular(window, N);
jamie@140 392 break;
jamie@140 393 case XTRACT_BARTLETT_HANN:
jamie@140 394 bartlett_hann(window, N);
jamie@140 395 break;
jamie@140 396 case XTRACT_BLACKMAN:
jamie@140 397 blackman(window, N);
jamie@140 398 break;
jamie@140 399 case XTRACT_KAISER:
jamie@140 400 kaiser(window, N, 3 * PI);
jamie@140 401 break;
jamie@140 402 case XTRACT_BLACKMAN_HARRIS:
jamie@140 403 blackman_harris(window, N);
jamie@140 404 break;
jamie@140 405 default:
jamie@140 406 hann(window, N);
jamie@140 407 break;
jamie@107 408 }
jamie@107 409
jamie@107 410 return window;
jamie@107 411 }
jamie@107 412
/**
 * Release a window buffer by passing it to free().
 *
 * @param window buffer to release
 */
void xtract_free_window(double *window)
{
    free(window);
}
jamie@107 417
jamie@102 418 #ifdef __GNUC__
jamie@102 419 __attribute__((constructor)) void init()
jamie@102 420 #else
jamie@140 421 void _init()ยท
jamie@102 422 #endif
jamie@102 423 {
jamie@150 424 #ifdef USE_OOURA
jamie@140 425 ooura_data_dct.initialised = false;
jamie@140 426 ooura_data_spectrum.initialised = false;
jamie@140 427 ooura_data_autocorrelation_fft.initialised = false;
jamie@140 428 ooura_data_mfcc.initialised = false;
jamie@150 429 #else
jamie@150 430 vdsp_data_dct.initialised = false;
jamie@150 431 vdsp_data_spectrum.initialised = false;
jamie@150 432 vdsp_data_autocorrelation_fft.initialised = false;
jamie@150 433 vdsp_data_mfcc.initialised = false;
jamie@150 434 #endif
jamie@102 435 }