annotate src/Matcher.cpp @ 46:b0ebc3e2c016 refactors

Some fixes: int -> float
author Chris Cannam
date Thu, 13 Nov 2014 15:09:04 +0000
parents a1b7df871496
children 8cbc15519d2c
rev   line source
cannam@0 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
cannam@0 2
cannam@0 3 /*
cannam@0 4 Vamp feature extraction plugin using the MATCH audio alignment
cannam@0 5 algorithm.
cannam@0 6
cannam@0 7 Centre for Digital Music, Queen Mary, University of London.
cannam@0 8 This file copyright 2007 Simon Dixon, Chris Cannam and QMUL.
cannam@0 9
cannam@0 10 This program is free software; you can redistribute it and/or
cannam@0 11 modify it under the terms of the GNU General Public License as
cannam@0 12 published by the Free Software Foundation; either version 2 of the
cannam@0 13 License, or (at your option) any later version. See the file
cannam@0 14 COPYING included with this distribution for more information.
cannam@0 15 */
cannam@0 16
cannam@0 17 #include "Matcher.h"
cannam@0 18
cannam@0 19 #include <iostream>
cannam@0 20
cannam@4 21 #include <cstdlib>
Chris@16 22 #include <cassert>
cannam@4 23
Chris@10 24 //#define DEBUG_MATCHER 1
Chris@10 25
Chris@38 26 Matcher::Matcher(Parameters parameters,
Chris@38 27 FeatureExtractor::Parameters feParams,
Chris@38 28 Matcher *p) :
Chris@43 29 m_params(parameters),
Chris@43 30 m_featureExtractor(feParams),
Chris@43 31 m_metric(parameters.distanceNorm)
cannam@0 32 {
Chris@10 33 #ifdef DEBUG_MATCHER
Chris@43 34 cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ")" << endl;
Chris@10 35 #endif
cannam@0 36
Chris@43 37 m_otherMatcher = p; // the first matcher will need this to be set later
Chris@43 38 m_firstPM = (!p);
Chris@43 39 m_frameCount = 0;
Chris@43 40 m_runCount = 0;
Chris@43 41 m_featureSize = m_featureExtractor.getFeatureSize();
Chris@43 42 m_blockSize = 0;
Chris@23 43
Chris@43 44 m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
Chris@23 45 #ifdef DEBUG_MATCHER
Chris@43 46 cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
Chris@23 47 #endif
Chris@23 48
Chris@43 49 m_initialised = false;
Chris@23 50 }
Chris@23 51
Chris@43 52 Matcher::Matcher(Parameters parameters, Matcher *p, int m_featureSize_) :
Chris@43 53 m_params(parameters),
Chris@43 54 m_featureSize(m_featureSize_),
Chris@43 55 m_featureExtractor(FeatureExtractor::Parameters(m_params.sampleRate, m_params.fftSize)), // unused default config
Chris@43 56 m_metric(parameters.distanceNorm)
Chris@23 57 {
Chris@23 58 #ifdef DEBUG_MATCHER
Chris@43 59 cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ", " << m_featureSize << ")" << endl;
Chris@23 60 #endif
Chris@23 61
Chris@43 62 m_otherMatcher = p; // the first matcher will need this to be set later
Chris@43 63 m_firstPM = (!p);
Chris@43 64 m_frameCount = 0;
Chris@43 65 m_runCount = 0;
Chris@43 66 m_blockSize = 0;
cannam@0 67
Chris@43 68 m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
Chris@15 69 #ifdef DEBUG_MATCHER
Chris@43 70 cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
Chris@15 71 #endif
cannam@0 72
Chris@43 73 m_initialised = false;
Chris@23 74 }
cannam@0 75
cannam@0 76 Matcher::~Matcher()
cannam@0 77 {
Chris@10 78 #ifdef DEBUG_MATCHER
Chris@15 79 cerr << "Matcher(" << this << ")::~Matcher()" << endl;
Chris@10 80 #endif
cannam@0 81 }
cannam@0 82
cannam@0 83 void
cannam@0 84 Matcher::init()
cannam@0 85 {
Chris@43 86 if (m_initialised) return;
cannam@0 87
Chris@43 88 m_frames = vector<vector<double> >
Chris@43 89 (m_blockSize, vector<double>(m_featureSize, 0));
cannam@0 90
Chris@43 91 m_distXSize = m_blockSize * 2;
Chris@45 92
Chris@41 93 size();
cannam@0 94
Chris@43 95 m_frameCount = 0;
Chris@43 96 m_runCount = 0;
Chris@38 97
Chris@43 98 m_initialised = true;
Chris@16 99 }
Chris@16 100
cannam@0 101 void
Chris@41 102 Matcher::size()
cannam@0 103 {
Chris@43 104 int distSize = (m_params.maxRunCount + 1) * m_blockSize;
Chris@45 105 m_bestPathCost.resize(m_distXSize, vector<float>(distSize, 0));
Chris@45 106 m_distance.resize(m_distXSize, vector<float>(distSize, 0));
Chris@45 107 m_advance.resize(m_distXSize, vector<Advance>(distSize, AdvanceNone));
Chris@43 108 m_distYSizes.resize(m_distXSize, distSize);
Chris@43 109 m_first.resize(m_distXSize, 0);
Chris@43 110 m_last.resize(m_distXSize, 0);
Chris@38 111 }
cannam@0 112
Chris@14 113 vector<double>
Chris@21 114 Matcher::consumeFrame(double *reBuffer, double *imBuffer)
cannam@0 115 {
Chris@43 116 if (!m_initialised) init();
cannam@0 117
Chris@43 118 vector<double> real(reBuffer, reBuffer + m_params.fftSize/2 + 1);
Chris@43 119 vector<double> imag(imBuffer, imBuffer + m_params.fftSize/2 + 1);
Chris@43 120 vector<double> feature = m_featureExtractor.process(real, imag);
Chris@43 121 int frameIndex = m_frameCount % m_blockSize;
Chris@43 122 m_frames[frameIndex] = feature;
Chris@21 123 calcAdvance();
Chris@21 124
Chris@38 125 return feature;
Chris@23 126 }
Chris@21 127
Chris@23 128 void
Chris@23 129 Matcher::consumeFeatureVector(std::vector<double> feature)
Chris@23 130 {
Chris@43 131 if (!m_initialised) init();
Chris@43 132 int frameIndex = m_frameCount % m_blockSize;
Chris@43 133 m_frames[frameIndex] = feature;
Chris@23 134 calcAdvance();
Chris@21 135 }
Chris@21 136
Chris@21 137 void
Chris@21 138 Matcher::calcAdvance()
Chris@21 139 {
Chris@43 140 int frameIndex = m_frameCount % m_blockSize;
Chris@21 141
Chris@43 142 if (m_frameCount >= m_distXSize) {
Chris@43 143 m_distXSize *= 2;
Chris@41 144 size();
cannam@0 145 }
cannam@0 146
Chris@43 147 if (m_firstPM && (m_frameCount >= m_blockSize)) {
cannam@0 148
Chris@43 149 int len = m_last[m_frameCount - m_blockSize] -
Chris@43 150 m_first[m_frameCount - m_blockSize];
cannam@0 151
Chris@43 152 // We need to copy distance[m_frameCount-m_blockSize] to
Chris@43 153 // distance[m_frameCount], and then truncate
Chris@43 154 // distance[m_frameCount-m_blockSize] to its first len elements.
cannam@0 155 // Same for bestPathCost.
cannam@0 156 /*
Chris@43 157 std::cerr << "Matcher(" << this << "): moving " << distYSizes[m_frameCount - m_blockSize] << " from " << m_frameCount - m_blockSize << " to "
Chris@43 158 << m_frameCount << ", allocating " << len << " for "
Chris@43 159 << m_frameCount - m_blockSize << std::endl;
cannam@0 160 */
Chris@43 161 m_distance[m_frameCount] = m_distance[m_frameCount - m_blockSize];
Chris@43 162 m_distance[m_frameCount - m_blockSize].resize(len, 0);
cannam@0 163
Chris@43 164 m_bestPathCost[m_frameCount] = m_bestPathCost[m_frameCount - m_blockSize];
Chris@43 165 m_bestPathCost[m_frameCount - m_blockSize].resize(len, 0);
cannam@0 166
Chris@45 167 m_advance[m_frameCount] = m_advance[m_frameCount - m_blockSize];
Chris@46 168 m_advance[m_frameCount - m_blockSize].resize(len, AdvanceNone);
Chris@45 169
Chris@43 170 m_distYSizes[m_frameCount] = m_distYSizes[m_frameCount - m_blockSize];
Chris@43 171 m_distYSizes[m_frameCount - m_blockSize] = len;
cannam@0 172 }
cannam@0 173
Chris@43 174 int stop = m_otherMatcher->m_frameCount;
Chris@43 175 int index = stop - m_blockSize;
cannam@0 176 if (index < 0)
cannam@0 177 index = 0;
Chris@43 178 m_first[m_frameCount] = index;
Chris@43 179 m_last[m_frameCount] = stop;
cannam@0 180
Chris@46 181 float mn= -1;
Chris@46 182 float mx= -1;
cannam@0 183 for ( ; index < stop; index++) {
Chris@26 184
Chris@45 185 float dMN = m_metric.calcDistance
Chris@43 186 (m_frames[frameIndex],
Chris@45 187 m_otherMatcher->m_frames[index % m_blockSize]);
Chris@26 188
cannam@0 189 if (mx<0)
cannam@0 190 mx = mn = dMN;
cannam@0 191 else if (dMN > mx)
cannam@0 192 mx = dMN;
cannam@0 193 else if (dMN < mn)
cannam@0 194 mn = dMN;
Chris@26 195
Chris@43 196 if ((m_frameCount == 0) && (index == 0)) // first element
Chris@45 197 setValue(0, 0, AdvanceNone, 0, dMN);
Chris@43 198 else if (m_frameCount == 0) // first row
Chris@45 199 setValue(0, index, AdvanceOther,
cannam@0 200 getValue(0, index-1, true), dMN);
cannam@0 201 else if (index == 0) // first column
Chris@45 202 setValue(m_frameCount, index, AdvanceThis,
Chris@43 203 getValue(m_frameCount - 1, 0, true), dMN);
Chris@43 204 else if (index == m_otherMatcher->m_frameCount - m_blockSize) {
cannam@0 205 // missing value(s) due to cutoff
cannam@0 206 // - no previous value in current row (resp. column)
cannam@0 207 // - no diagonal value if prev. dir. == curr. dirn
Chris@46 208 float min2 = getValue(m_frameCount - 1, index, true);
Chris@43 209 // if ((m_firstPM && (first[m_frameCount - 1] == index)) ||
Chris@43 210 // (!m_firstPM && (m_last[index-1] < m_frameCount)))
Chris@43 211 if (m_first[m_frameCount - 1] == index)
Chris@45 212 setValue(m_frameCount, index, AdvanceThis, min2, dMN);
cannam@0 213 else {
Chris@46 214 float min1 = getValue(m_frameCount - 1, index - 1, true);
cannam@0 215 if (min1 + dMN <= min2)
Chris@45 216 setValue(m_frameCount, index, AdvanceBoth, min1,dMN);
cannam@0 217 else
Chris@45 218 setValue(m_frameCount, index, AdvanceThis, min2,dMN);
cannam@0 219 }
cannam@0 220 } else {
Chris@46 221 float min1 = getValue(m_frameCount, index-1, true);
Chris@46 222 float min2 = getValue(m_frameCount - 1, index, true);
Chris@46 223 float min3 = getValue(m_frameCount - 1, index-1, true);
cannam@0 224 if (min1 <= min2) {
cannam@0 225 if (min3 + dMN <= min1)
Chris@45 226 setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
cannam@0 227 else
Chris@45 228 setValue(m_frameCount, index, AdvanceOther,min1,dMN);
cannam@0 229 } else {
cannam@0 230 if (min3 + dMN <= min2)
Chris@45 231 setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
cannam@0 232 else
Chris@45 233 setValue(m_frameCount, index, AdvanceThis, min2,dMN);
cannam@0 234 }
cannam@0 235 }
Chris@43 236 m_otherMatcher->m_last[index]++;
cannam@0 237 } // loop for row (resp. column)
cannam@0 238
Chris@43 239 m_frameCount++;
Chris@43 240 m_runCount++;
cannam@0 241
Chris@43 242 m_otherMatcher->m_runCount = 0;
Chris@21 243 }
cannam@0 244
Chris@46 245 float
cannam@0 246 Matcher::getValue(int i, int j, bool firstAttempt)
cannam@0 247 {
Chris@43 248 if (m_firstPM)
Chris@43 249 return m_bestPathCost[i][j - m_first[i]];
cannam@0 250 else
Chris@43 251 return m_otherMatcher->m_bestPathCost[j][i - m_otherMatcher->m_first[j]];
cannam@0 252 } // getValue()
cannam@0 253
cannam@0 254 void
Chris@45 255 Matcher::setValue(int i, int j, Advance dir, float value, float dMN)
cannam@0 256 {
Chris@43 257 if (m_firstPM) {
Chris@45 258
Chris@45 259 int jdx = j - m_first[i];
Chris@45 260 m_distance[i][jdx] = dMN;
Chris@45 261 m_advance[i][jdx] = dir;
Chris@45 262 m_bestPathCost[i][jdx] =
Chris@45 263 (value + (dir == AdvanceBoth ? dMN*2: dMN));
Chris@45 264
cannam@0 265 } else {
Chris@45 266
Chris@45 267 if (dir == AdvanceThis) {
Chris@45 268 dir = AdvanceOther;
Chris@45 269 } else if (dir == AdvanceOther) {
Chris@45 270 dir = AdvanceThis;
Chris@45 271 }
Chris@45 272
Chris@43 273 int idx = i - m_otherMatcher->m_first[j];
Chris@45 274
Chris@43 275 if (idx == (int)m_otherMatcher->m_distYSizes[j]) {
cannam@0 276 // This should never happen, but if we allow arbitrary
cannam@0 277 // pauses in either direction, and arbitrary lengths at
cannam@0 278 // end, it is better than a segmentation fault.
cannam@0 279 std::cerr << "Emergency resize: " << idx << " -> " << idx * 2 << std::endl;
Chris@43 280 m_otherMatcher->m_distYSizes[j] = idx * 2;
Chris@43 281 m_otherMatcher->m_bestPathCost[j].resize(idx * 2, 0);
Chris@43 282 m_otherMatcher->m_distance[j].resize(idx * 2, 0);
Chris@46 283 m_otherMatcher->m_advance[j].resize(idx * 2, AdvanceNone);
cannam@0 284 }
Chris@45 285
Chris@45 286 m_otherMatcher->m_distance[j][idx] = dMN;
Chris@45 287 m_otherMatcher->m_advance[j][idx] = dir;
Chris@43 288 m_otherMatcher->m_bestPathCost[j][idx] =
Chris@45 289 (value + (dir == AdvanceBoth ? dMN*2: dMN));
cannam@0 290 }
cannam@0 291 } // setValue()
cannam@0 292