annotate examples/simpletest/simpletest.cpp @ 285:89fe52066db1 tip master

MSVC missing ssize_t fix
author Jamie Bullock <jamie@jamiebullock.com>
date Tue, 16 Jul 2019 18:29:20 +0100
parents 8c768f32a6a8
children
rev   line source
jamie@235 1 /*
jamie@235 2 * Copyright (C) 2012 Jamie Bullock
jamie@235 3 *
jamie@235 4 * Permission is hereby granted, free of charge, to any person obtaining a copy
jamie@235 5 * of this software and associated documentation files (the "Software"), to
jamie@235 6 * deal in the Software without restriction, including without limitation the
jamie@235 7 * rights to use, copy, modify, merge, publish, distribute, sublicense, and/or
jamie@235 8 * sell copies of the Software, and to permit persons to whom the Software is
jamie@235 9 * furnished to do so, subject to the following conditions:
jamie@235 10 *
jamie@235 11 * The above copyright notice and this permission notice shall be included in
jamie@235 12 * all copies or substantial portions of the Software.
jamie@235 13 *
jamie@235 14 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
jamie@235 15 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
jamie@235 16 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
jamie@235 17 * AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
jamie@235 18 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
jamie@235 19 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS
jamie@235 20 * IN THE SOFTWARE.
jamie@235 21 *
jamie@235 22 */
jamie@235 23
#include <iostream>
#include <vector>

#include <stdint.h>
#include <stdio.h>
#include <stdlib.h>
#include <math.h>
#include <stdbool.h>

#include "xtract/libxtract.h"
#include "xtract/xtract_stateful.h"
#include "xtract/xtract_scalar.h"
#include "xtract/xtract_helper.h"
#include "WaveFile.h"
jamie@235 36
jamie@235 37 #ifndef M_PI
jamie@235 38 #define M_PI 3.14159265358979323846264338327
jamie@235 39 #endif
jamie@235 40
jamie@235 41 using namespace std;
jamie@235 42
/* Waveform shapes that fill_wavetable() can generate. */
typedef enum waveform_type_
{
    SINE,
    SAWTOOTH,
    SQUARE,
    NOISE
}
waveform_type;

#define BLOCKSIZE 512                   /* samples per analysis block / wavetable length */
#define MAVG_COUNT 10                   /* number of recent flux values kept for peak picking */
#define HALF_BLOCKSIZE (BLOCKSIZE >> 1) /* hop size and sub-frame length */
#define SAMPLERATE 44100                /* samples per second */
#define PERIOD 102                      /* legacy fixed period; no longer used by fill_wavetable() */
#define MFCC_FREQ_BANDS 13
#define MFCC_FREQ_MIN 20
#define MFCC_FREQ_MAX 20000


/* Synthetic test signal written by fill_wavetable(). */
double wavetable[BLOCKSIZE];

/*
 * Fill the global wavetable with BLOCKSIZE samples of the requested waveform.
 *
 * frequency: fundamental in Hz. The period is the whole number of samples
 *            SAMPLERATE / frequency, truncated. Ignored for NOISE.
 * type:      waveform shape to generate.
 *
 * The periodic shapes are scaled by the period derived from `frequency`, so
 * each cycle spans the full amplitude range and wraps without a jump.
 * If `frequency` is not in (0, SAMPLERATE] (including NaN) no period of at
 * least one sample exists; the periodic shapes then produce silence instead
 * of dividing by zero.
 */
void fill_wavetable(const float frequency, waveform_type type)
{
    /* Period length in whole samples, held as a double so that very low
     * frequencies cannot overflow an integer. 0.0 marks "no usable period". */
    double period = 0.0;

    if (frequency > 0.f)
    {
        period = floor((double)(SAMPLERATE / frequency));
    }

    const bool has_period = (period >= 1.0);

    for (int i = 0; i < BLOCKSIZE; ++i)
    {
        if (type == NOISE)
        {
            /* rand() rather than the POSIX-only random() so this builds on MSVC;
             * values lie in [-1, 1) in steps of 1/500 */
            wavetable[i] = ((rand() % 1000) / 500.0) - 1;
            continue;
        }

        if (!has_period)
        {
            wavetable[i] = 0.0;
            continue;
        }

        /* Position within the current cycle, in samples: 0 .. period - 1 */
        const double phase = fmod((double)i, period);

        switch (type)
        {
            case SINE:
                wavetable[i] = sin((phase / period) * 2 * M_PI);
                break;
            case SQUARE:
                /* low for the first half of the cycle, high for the second */
                wavetable[i] = (phase < (period / 2.0)) ? -1.0 : 1.0;
                break;
            case SAWTOOTH:
                /* linear ramp starting at -1 and rising towards +1 over one cycle */
                wavetable[i] = ((phase / period) * 2) - 1.;
                break;
            case NOISE:
                /* handled above */
                break;
        }
    }
}
jamie@235 97
jamie@235 98 void print_wavetable(void)
jamie@235 99 {
jamie@235 100 for (int i = 0; i < BLOCKSIZE; ++i)
jamie@235 101 {
jamie@235 102 printf("%f\n", wavetable[i]);
jamie@235 103 }
jamie@235 104 }
jamie@235 105
jamie@235 106 int main(void)
jamie@235 107 {
jamie@235 108 double mean = 0.0;
jamie@235 109 double f0 = 0.0;
jamie@235 110 double midicents = 0.0;
jamie@235 111 double flux = 0.0;
jamie@235 112 double centroid = 0.0;
jamie@235 113 double lowest = 0.0;
jamie@235 114 double spectrum[BLOCKSIZE] = {0};
jamie@235 115 double windowed[BLOCKSIZE] = {0};
jamie@235 116 double peaks[BLOCKSIZE] = {0};
jamie@235 117 double harmonics[BLOCKSIZE] = {0};
jamie@235 118 double subframes_windowed[BLOCKSIZE] = {0};
jamie@235 119 double subframes_spectrum[BLOCKSIZE] = {0};
jamie@235 120 double difference[HALF_BLOCKSIZE] = {0};
jamie@235 121 double lastn[MAVG_COUNT] = {0};
jamie@235 122 double *window = NULL;
jamie@235 123 double *window_subframe = NULL;
jamie@235 124 double mfccs[MFCC_FREQ_BANDS] = {0};
jamie@235 125 double argd[4] = {0};
jamie@235 126 double samplerate = 44100.0;
jamie@235 127 double prev_note = 0.0;
jamie@235 128 int n;
jamie@235 129 int rv = XTRACT_SUCCESS;
jamie@235 130 double last_found_peak_time = 0.0;
jamie@235 131 WaveFile wavFile("test.wav");
jamie@235 132 xtract_mel_filter mel_filters;
jamie@235 133 xtract_last_n_state *last_n_state = xtract_last_n_state_new(MAVG_COUNT);
jamie@235 134
jamie@235 135 if (!wavFile.IsLoaded())
jamie@235 136 {
jamie@235 137 return EXIT_FAILURE;
jamie@235 138 }
jamie@235 139
jamie@235 140 float *wavData = (float *)wavFile.GetData(); // assume 32-bit float
jamie@235 141 std::size_t wavBytes = wavFile.GetDataSize();
jamie@235 142 uint64_t wavSamples = wavBytes / sizeof(float);
jamie@235 143 double data[wavSamples];
jamie@235 144
jamie@235 145 for (n = 0; n < wavSamples; ++n)
jamie@235 146 {
jamie@235 147 data[n] = (double)wavData[n];
jamie@235 148 }
jamie@235 149 // Convert to double
jamie@235 150
jamie@235 151
jamie@235 152 /* Allocate Mel filters */
jamie@235 153 mel_filters.n_filters = MFCC_FREQ_BANDS;
jamie@235 154 mel_filters.filters = (double **)malloc(MFCC_FREQ_BANDS * sizeof(double *));
jamie@235 155 for(uint8_t k = 0; k < MFCC_FREQ_BANDS; ++k)
jamie@235 156 {
jamie@235 157 mel_filters.filters[k] = (double *)malloc(BLOCKSIZE * sizeof(double));
jamie@235 158 }
jamie@235 159
jamie@235 160 xtract_init_mfcc(BLOCKSIZE >> 1, SAMPLERATE >> 1, XTRACT_EQUAL_GAIN, MFCC_FREQ_MIN, MFCC_FREQ_MAX, mel_filters.n_filters, mel_filters.filters);
jamie@235 161
jamie@235 162 /* create the window functions */
jamie@235 163 window = xtract_init_window(BLOCKSIZE, XTRACT_HANN);
jamie@235 164 window_subframe = xtract_init_window(HALF_BLOCKSIZE, XTRACT_HANN);
jamie@235 165 xtract_init_wavelet_f0_state();
jamie@235 166
jamie@235 167 // fill_wavetable(344.53125f, NOISE); // 344.53125f = 128 samples @ 44100 Hz
jamie@235 168 // fill_wavetable(344.53125f, SINE); // 344.53125f = 128 samples @ 44100 Hz
jamie@235 169
jamie@235 170 /*
jamie@235 171 print_wavetable();
jamie@235 172 */
jamie@235 173 std::cout << "File has " << wavSamples << " samples" << std::endl;
jamie@235 174 int peak_found = XTRACT_NO_RESULT;
jamie@235 175
jamie@235 176 for (uint64_t n = 0; (n + BLOCKSIZE) < wavSamples; n += HALF_BLOCKSIZE) // Overlap by HALF_BLOCKSIZE
jamie@235 177 {
jamie@235 178 /* get the F0 */
jamie@235 179 xtract[XTRACT_WAVELET_F0](&data[n], BLOCKSIZE, &samplerate, &f0);
jamie@235 180
jamie@235 181 /* get the F0 as a MIDI note */
jamie@235 182 if (f0 != 0.0)
jamie@235 183 {
jamie@235 184 xtract[XTRACT_MIDICENT](NULL, 0, &f0, &midicents);
jamie@235 185 int note = (int)round(midicents / 100);
jamie@235 186 if (note != prev_note)
jamie@235 187 {
jamie@235 188 printf("Pitch: %d at %f\n", note, n / (float)SAMPLERATE);
jamie@235 189 }
jamie@235 190 prev_note = note;
jamie@235 191 }
jamie@235 192
jamie@235 193 xtract_windowed(&data[n], BLOCKSIZE, window, windowed);
jamie@235 194
jamie@235 195 /* get the spectrum */
jamie@235 196 argd[0] = SAMPLERATE / (double)BLOCKSIZE;
jamie@235 197 argd[1] = XTRACT_MAGNITUDE_SPECTRUM;
jamie@235 198 argd[2] = 0.f; /* DC component - we expect this to zero for square wave */
jamie@235 199 argd[3] = 0.f; /* No Normalisation */
jamie@235 200
jamie@235 201 xtract_init_fft(BLOCKSIZE, XTRACT_SPECTRUM);
jamie@235 202 xtract[XTRACT_SPECTRUM](windowed, BLOCKSIZE, &argd[0], spectrum);
jamie@235 203 xtract_free_fft();
jamie@235 204
jamie@235 205 xtract[XTRACT_SPECTRAL_CENTROID](spectrum, BLOCKSIZE, NULL, &centroid);
jamie@235 206
jamie@235 207 argd[1] = 10.0; /* peak threshold as % of maximum peak */
jamie@235 208 xtract[XTRACT_PEAK_SPECTRUM](spectrum, BLOCKSIZE / 2, argd, peaks);
jamie@235 209
jamie@235 210 argd[0] = f0;
jamie@235 211 argd[1] = .3; /* harmonic threshold */
jamie@235 212 xtract[XTRACT_HARMONIC_SPECTRUM](peaks, BLOCKSIZE, argd, harmonics);
jamie@235 213
jamie@235 214 /* compute the MFCCs */
jamie@235 215 xtract_mfcc(spectrum, BLOCKSIZE >> 1, &mel_filters, mfccs);
jamie@235 216
jamie@235 217 double gated[BLOCKSIZE] = {0};
jamie@235 218 double block_max = 0.0;
jamie@235 219
jamie@235 220 /* crude noise gate */
jamie@235 221 for (uint16_t k = 0; k < BLOCKSIZE; ++k)
jamie@235 222 {
jamie@235 223 if (fabs(data[n+k]) > block_max)
jamie@235 224 {
jamie@235 225 block_max = fabs(data[n+k]);
jamie@235 226 }
jamie@235 227
jamie@235 228 if (data[n+k] > .1)
jamie@235 229 {
jamie@235 230 gated[k] = data[n+k];
jamie@235 231 }
jamie@235 232 }
jamie@235 233
jamie@235 234 /* normalise */
jamie@235 235 double norm_factor = block_max > 0.0 ? 1.0 / block_max : 0.0;
jamie@235 236
jamie@235 237 for (uint16_t k = 0; k < BLOCKSIZE; ++k)
jamie@235 238 {
jamie@235 239 gated[k] *= norm_factor;
jamie@235 240 }
jamie@235 241
jamie@235 242 /* compute Spectral Flux */
jamie@235 243 argd[0] = SAMPLERATE / HALF_BLOCKSIZE;
jamie@235 244 argd[1] = XTRACT_LOG_POWER_SPECTRUM;
jamie@235 245 argd[2] = 0.f; /* DC component */
jamie@235 246 argd[3] = 1.f; /* Yes Normalisation */
jamie@235 247
jamie@235 248 xtract_features_from_subframes(gated, BLOCKSIZE, XTRACT_WINDOWED, window_subframe, subframes_windowed);
jamie@235 249 xtract_init_fft(HALF_BLOCKSIZE, XTRACT_SPECTRUM);
jamie@235 250 xtract_features_from_subframes(subframes_windowed, BLOCKSIZE, XTRACT_SPECTRUM, argd, subframes_spectrum);
jamie@235 251 xtract_free_fft();
jamie@235 252
jamie@244 253 argd[0] = 0.5; /* smoothing factor */
jamie@244 254
jamie@244 255 /* smooth the amplitude components of the first and second spectra */
jamie@244 256 xtract_smoothed(subframes_spectrum, HALF_BLOCKSIZE >> 1, argd, subframes_spectrum);
jamie@244 257 xtract_smoothed(subframes_spectrum + HALF_BLOCKSIZE, HALF_BLOCKSIZE >> 1, argd, subframes_spectrum + HALF_BLOCKSIZE);
jamie@244 258
jamie@244 259 /* difference between the two spectra */
jamie@235 260 xtract_difference_vector(subframes_spectrum, BLOCKSIZE, NULL, difference);
jamie@235 261
jamie@235 262 argd[0] = .25; /* norm order */
jamie@235 263 argd[1] = XTRACT_POSITIVE_SLOPE; /* positive slope */
jamie@235 264 argd[2] = 1; /* normalise */
jamie@235 265
jamie@235 266 /* Right shift HALF_BLOCKSIZE because we only want amplitudes not frequencies */
jamie@235 267 xtract_flux(difference, HALF_BLOCKSIZE >> 1, argd, &flux);
jamie@235 268
jamie@235 269 xtract_last_n(last_n_state, &flux, MAVG_COUNT, NULL, lastn);
jamie@235 270
jamie@235 271 argd[0] = 10; /* flux threshold */
jamie@235 272 double flux_current = 0.0;
jamie@235 273
jamie@235 274 peak_found = xtract_peak(lastn, MAVG_COUNT, argd, &flux_current);
jamie@235 275
jamie@235 276 if (peak_found == XTRACT_SUCCESS)
jamie@235 277 {
jamie@235 278 double peak_time = n / (float)SAMPLERATE;
jamie@235 279 if (peak_time - last_found_peak_time > .05 || peak_time < .05)
jamie@235 280 {
jamie@235 281 printf("Onset at %f seconds\n", n / (float)SAMPLERATE);
jamie@235 282 last_found_peak_time = peak_time;
jamie@235 283 }
jamie@235 284 }
jamie@235 285 }
jamie@235 286
jamie@235 287 /* cleanup */
jamie@235 288 for(n = 0; n < MFCC_FREQ_BANDS; ++n)
jamie@235 289 {
jamie@235 290 free(mel_filters.filters[n]);
jamie@235 291 }
jamie@235 292 free(mel_filters.filters);
jamie@235 293
jamie@235 294 xtract_free_window(window);
jamie@235 295 xtract_free_window(window_subframe);
jamie@235 296
jamie@235 297 return 0;
jamie@235 298
jamie@235 299 }