annotate src/FeatureExtractor.cpp @ 103:593054bf6476 feature_conditioner

Pull out normalisation and specdiff stuff into FeatureConditioner
author Chris Cannam
date Thu, 04 Dec 2014 13:05:16 +0000
parents b9aa663a607b
children cfba9aec7569
rev   line source
Chris@37 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@37 2
Chris@37 3 /*
Chris@37 4 Vamp feature extraction plugin using the MATCH audio alignment
Chris@37 5 algorithm.
Chris@37 6
Chris@37 7 Centre for Digital Music, Queen Mary, University of London.
Chris@37 8 This file copyright 2007 Simon Dixon, Chris Cannam and QMUL.
Chris@37 9
Chris@37 10 This program is free software; you can redistribute it and/or
Chris@37 11 modify it under the terms of the GNU General Public License as
Chris@37 12 published by the Free Software Foundation; either version 2 of the
Chris@37 13 License, or (at your option) any later version. See the file
Chris@37 14 COPYING included with this distribution for more information.
Chris@37 15 */
Chris@37 16
Chris@37 17 #include "FeatureExtractor.h"
Chris@37 18
Chris@37 19 #include <iostream>
Chris@37 20
Chris@37 21 #include <cstdlib>
Chris@37 22 #include <cassert>
Chris@37 23 #include <cmath>
Chris@37 24
Chris@37 25 using namespace std;
Chris@37 26
Chris@37 27 FeatureExtractor::FeatureExtractor(Parameters parameters) :
Chris@103 28 m_params(parameters)
Chris@37 29 {
Chris@74 30 m_featureSize = getFeatureSizeFor(parameters);
Chris@37 31 makeFreqMap();
Chris@37 32 }
Chris@37 33
Chris@74 34 int
Chris@74 35 FeatureExtractor::getFeatureSizeFor(Parameters parameters)
Chris@74 36 {
Chris@74 37 if (parameters.useChromaFrequencyMap) {
Chris@74 38 return 13;
Chris@74 39 } else {
Chris@74 40 return 84;
Chris@74 41 }
Chris@74 42 }
Chris@74 43
Chris@37 44 void
Chris@37 45 FeatureExtractor::makeFreqMap()
Chris@37 46 {
Chris@37 47 m_freqMap = vector<int>(m_params.fftSize / 2 + 1, 0);
Chris@37 48
Chris@37 49 if (m_params.useChromaFrequencyMap) {
Chris@37 50 #ifdef DEBUG_MATCHER
Chris@37 51 cerr << "makeFreqMap: calling makeChromaFrequencyMap" << endl;
Chris@37 52 #endif
Chris@37 53 makeChromaFrequencyMap();
Chris@37 54 } else {
Chris@37 55 #ifdef DEBUG_MATCHER
Chris@37 56 cerr << "makeFreqMap: calling makeStandardFrequencyMap" << endl;
Chris@37 57 #endif
Chris@37 58 makeStandardFrequencyMap();
Chris@37 59 }
Chris@37 60 }
Chris@37 61
Chris@37 62 void
Chris@37 63 FeatureExtractor::makeStandardFrequencyMap()
Chris@37 64 {
Chris@37 65 double binWidth = m_params.sampleRate / m_params.fftSize;
Chris@37 66 int crossoverBin = (int)(2 / (pow(2, 1/12.0) - 1));
Chris@37 67 int crossoverMidi = lrint(log(crossoverBin*binWidth/440.0)/
Chris@37 68 log(2.0) * 12 + 69);
Chris@37 69
Chris@37 70 // freq = 440 * Math.pow(2, (midi-69)/12.0) / binWidth;
Chris@37 71
Chris@37 72 int i = 0;
Chris@37 73 while (i <= crossoverBin) {
Chris@37 74 m_freqMap[i] = i;
Chris@37 75 ++i;
Chris@37 76 }
Chris@37 77
Chris@37 78 while (i <= m_params.fftSize/2) {
Chris@37 79 double midi = log(i*binWidth/440.0) / log(2.0) * 12 + 69;
Chris@37 80 if (midi > 127) midi = 127;
Chris@40 81 int target = crossoverBin + lrint(midi) - crossoverMidi;
Chris@40 82 if (target >= m_featureSize) target = m_featureSize - 1;
Chris@40 83 m_freqMap[i++] = target;
Chris@37 84 }
Chris@37 85 }
Chris@37 86
Chris@37 87 void
Chris@37 88 FeatureExtractor::makeChromaFrequencyMap()
Chris@37 89 {
Chris@37 90 double binWidth = m_params.sampleRate / m_params.fftSize;
Chris@37 91 int crossoverBin = (int)(1 / (pow(2, 1/12.0) - 1));
Chris@37 92 int i = 0;
Chris@37 93 while (i <= crossoverBin) {
Chris@37 94 m_freqMap[i++] = 0;
Chris@37 95 }
Chris@37 96 while (i <= m_params.fftSize/2) {
Chris@37 97 double midi = log(i*binWidth/440.0) / log(2.0) * 12 + 69;
Chris@37 98 m_freqMap[i++] = (lrint(midi)) % 12 + 1;
Chris@37 99 }
Chris@37 100 }
Chris@37 101
Chris@37 102 vector<double>
Chris@37 103 FeatureExtractor::process(const vector<double> &real, const vector<double> &imag)
Chris@37 104 {
Chris@37 105 vector<double> frame(m_featureSize, 0.0);
Chris@37 106
Chris@37 107 for (int i = 0; i <= m_params.fftSize/2; i++) {
Chris@37 108 double mag = real[i] * real[i] + imag[i] * imag[i];
Chris@37 109 frame[m_freqMap[i]] += mag;
Chris@37 110 }
Chris@37 111
Chris@103 112 return frame;
Chris@74 113 }
Chris@74 114
Chris@74 115 vector<double>
Chris@74 116 FeatureExtractor::process(const float *cframe)
Chris@74 117 {
Chris@74 118 vector<double> frame(m_featureSize, 0.0);
Chris@74 119
Chris@74 120 for (int i = 0; i <= m_params.fftSize/2; i++) {
Chris@74 121 double mag = cframe[i*2] * cframe[i*2] + cframe[i*2+1] * cframe[i*2+1];
Chris@74 122 frame[m_freqMap[i]] += mag;
Chris@74 123 }
Chris@74 124
Chris@103 125 return frame;
Chris@74 126 }
Chris@74 127