annotate src/Matcher.cpp @ 45:a1b7df871496 refactors

Replace char dist (inc dir in masked section) with float dist + separate dir
author Chris Cannam
date Thu, 13 Nov 2014 14:43:03 +0000
parents 6a5d165e5ea4
children b0ebc3e2c016
rev   line source
cannam@0 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
cannam@0 2
cannam@0 3 /*
cannam@0 4 Vamp feature extraction plugin using the MATCH audio alignment
cannam@0 5 algorithm.
cannam@0 6
cannam@0 7 Centre for Digital Music, Queen Mary, University of London.
cannam@0 8 This file copyright 2007 Simon Dixon, Chris Cannam and QMUL.
cannam@0 9
cannam@0 10 This program is free software; you can redistribute it and/or
cannam@0 11 modify it under the terms of the GNU General Public License as
cannam@0 12 published by the Free Software Foundation; either version 2 of the
cannam@0 13 License, or (at your option) any later version. See the file
cannam@0 14 COPYING included with this distribution for more information.
cannam@0 15 */
cannam@0 16
cannam@0 17 #include "Matcher.h"
cannam@0 18
cannam@0 19 #include <iostream>
cannam@0 20
cannam@4 21 #include <cstdlib>
Chris@16 22 #include <cassert>
cannam@4 23
Chris@10 24 //#define DEBUG_MATCHER 1
Chris@10 25
Chris@38 26 Matcher::Matcher(Parameters parameters,
Chris@38 27 FeatureExtractor::Parameters feParams,
Chris@38 28 Matcher *p) :
Chris@43 29 m_params(parameters),
Chris@43 30 m_featureExtractor(feParams),
Chris@43 31 m_metric(parameters.distanceNorm)
cannam@0 32 {
Chris@10 33 #ifdef DEBUG_MATCHER
Chris@43 34 cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ")" << endl;
Chris@10 35 #endif
cannam@0 36
Chris@43 37 m_otherMatcher = p; // the first matcher will need this to be set later
Chris@43 38 m_firstPM = (!p);
Chris@43 39 m_frameCount = 0;
Chris@43 40 m_runCount = 0;
Chris@43 41 m_featureSize = m_featureExtractor.getFeatureSize();
Chris@43 42 m_blockSize = 0;
Chris@23 43
Chris@43 44 m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
Chris@23 45 #ifdef DEBUG_MATCHER
Chris@43 46 cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
Chris@23 47 #endif
Chris@23 48
Chris@43 49 m_initialised = false;
Chris@23 50 }
Chris@23 51
Chris@43 52 Matcher::Matcher(Parameters parameters, Matcher *p, int m_featureSize_) :
Chris@43 53 m_params(parameters),
Chris@43 54 m_featureSize(m_featureSize_),
Chris@43 55 m_featureExtractor(FeatureExtractor::Parameters(m_params.sampleRate, m_params.fftSize)), // unused default config
Chris@43 56 m_metric(parameters.distanceNorm)
Chris@23 57 {
Chris@23 58 #ifdef DEBUG_MATCHER
Chris@43 59 cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ", " << m_featureSize << ")" << endl;
Chris@23 60 #endif
Chris@23 61
Chris@43 62 m_otherMatcher = p; // the first matcher will need this to be set later
Chris@43 63 m_firstPM = (!p);
Chris@43 64 m_frameCount = 0;
Chris@43 65 m_runCount = 0;
Chris@43 66 m_blockSize = 0;
cannam@0 67
Chris@43 68 m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
Chris@15 69 #ifdef DEBUG_MATCHER
Chris@43 70 cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
Chris@15 71 #endif
cannam@0 72
Chris@43 73 m_initialised = false;
Chris@23 74 }
cannam@0 75
cannam@0 76 Matcher::~Matcher()
cannam@0 77 {
Chris@10 78 #ifdef DEBUG_MATCHER
Chris@15 79 cerr << "Matcher(" << this << ")::~Matcher()" << endl;
Chris@10 80 #endif
cannam@0 81 }
cannam@0 82
cannam@0 83 void
cannam@0 84 Matcher::init()
cannam@0 85 {
Chris@43 86 if (m_initialised) return;
cannam@0 87
Chris@43 88 m_frames = vector<vector<double> >
Chris@43 89 (m_blockSize, vector<double>(m_featureSize, 0));
cannam@0 90
Chris@43 91 m_distXSize = m_blockSize * 2;
Chris@45 92
Chris@41 93 size();
cannam@0 94
Chris@43 95 m_frameCount = 0;
Chris@43 96 m_runCount = 0;
Chris@38 97
Chris@43 98 m_initialised = true;
Chris@16 99 }
Chris@16 100
cannam@0 101 void
Chris@41 102 Matcher::size()
cannam@0 103 {
Chris@43 104 int distSize = (m_params.maxRunCount + 1) * m_blockSize;
Chris@45 105 m_bestPathCost.resize(m_distXSize, vector<float>(distSize, 0));
Chris@45 106 m_distance.resize(m_distXSize, vector<float>(distSize, 0));
Chris@45 107 m_advance.resize(m_distXSize, vector<Advance>(distSize, AdvanceNone));
Chris@43 108 m_distYSizes.resize(m_distXSize, distSize);
Chris@43 109 m_first.resize(m_distXSize, 0);
Chris@43 110 m_last.resize(m_distXSize, 0);
Chris@38 111 }
cannam@0 112
Chris@14 113 vector<double>
Chris@21 114 Matcher::consumeFrame(double *reBuffer, double *imBuffer)
cannam@0 115 {
Chris@43 116 if (!m_initialised) init();
cannam@0 117
Chris@43 118 vector<double> real(reBuffer, reBuffer + m_params.fftSize/2 + 1);
Chris@43 119 vector<double> imag(imBuffer, imBuffer + m_params.fftSize/2 + 1);
Chris@43 120 vector<double> feature = m_featureExtractor.process(real, imag);
Chris@43 121 int frameIndex = m_frameCount % m_blockSize;
Chris@43 122 m_frames[frameIndex] = feature;
Chris@21 123 calcAdvance();
Chris@21 124
Chris@38 125 return feature;
Chris@23 126 }
Chris@21 127
Chris@23 128 void
Chris@23 129 Matcher::consumeFeatureVector(std::vector<double> feature)
Chris@23 130 {
Chris@43 131 if (!m_initialised) init();
Chris@43 132 int frameIndex = m_frameCount % m_blockSize;
Chris@43 133 m_frames[frameIndex] = feature;
Chris@23 134 calcAdvance();
Chris@21 135 }
Chris@21 136
Chris@21 137 void
Chris@21 138 Matcher::calcAdvance()
Chris@21 139 {
Chris@43 140 int frameIndex = m_frameCount % m_blockSize;
Chris@21 141
Chris@43 142 if (m_frameCount >= m_distXSize) {
Chris@43 143 m_distXSize *= 2;
Chris@41 144 size();
cannam@0 145 }
cannam@0 146
Chris@43 147 if (m_firstPM && (m_frameCount >= m_blockSize)) {
cannam@0 148
Chris@43 149 int len = m_last[m_frameCount - m_blockSize] -
Chris@43 150 m_first[m_frameCount - m_blockSize];
cannam@0 151
Chris@43 152 // We need to copy distance[m_frameCount-m_blockSize] to
Chris@43 153 // distance[m_frameCount], and then truncate
Chris@43 154 // distance[m_frameCount-m_blockSize] to its first len elements.
cannam@0 155 // Same for bestPathCost.
cannam@0 156 /*
Chris@43 157 std::cerr << "Matcher(" << this << "): moving " << distYSizes[m_frameCount - m_blockSize] << " from " << m_frameCount - m_blockSize << " to "
Chris@43 158 << m_frameCount << ", allocating " << len << " for "
Chris@43 159 << m_frameCount - m_blockSize << std::endl;
cannam@0 160 */
Chris@43 161 m_distance[m_frameCount] = m_distance[m_frameCount - m_blockSize];
Chris@43 162 m_distance[m_frameCount - m_blockSize].resize(len, 0);
cannam@0 163
Chris@43 164 m_bestPathCost[m_frameCount] = m_bestPathCost[m_frameCount - m_blockSize];
Chris@43 165 m_bestPathCost[m_frameCount - m_blockSize].resize(len, 0);
cannam@0 166
Chris@45 167 m_advance[m_frameCount] = m_advance[m_frameCount - m_blockSize];
Chris@45 168 m_advance[m_frameCount - m_blockSize].resize(len);
Chris@45 169
Chris@43 170 m_distYSizes[m_frameCount] = m_distYSizes[m_frameCount - m_blockSize];
Chris@43 171 m_distYSizes[m_frameCount - m_blockSize] = len;
cannam@0 172 }
cannam@0 173
Chris@43 174 int stop = m_otherMatcher->m_frameCount;
Chris@43 175 int index = stop - m_blockSize;
cannam@0 176 if (index < 0)
cannam@0 177 index = 0;
Chris@43 178 m_first[m_frameCount] = index;
Chris@43 179 m_last[m_frameCount] = stop;
cannam@0 180
cannam@0 181 bool overflow = false;
cannam@0 182 int mn= -1;
cannam@0 183 int mx= -1;
cannam@0 184 for ( ; index < stop; index++) {
Chris@26 185
Chris@45 186 float dMN = m_metric.calcDistance
Chris@43 187 (m_frames[frameIndex],
Chris@45 188 m_otherMatcher->m_frames[index % m_blockSize]);
Chris@26 189
cannam@0 190 if (mx<0)
cannam@0 191 mx = mn = dMN;
cannam@0 192 else if (dMN > mx)
cannam@0 193 mx = dMN;
cannam@0 194 else if (dMN < mn)
cannam@0 195 mn = dMN;
cannam@0 196 if (dMN >= 255) {
cannam@0 197 overflow = true;
cannam@0 198 dMN = 255;
cannam@0 199 }
Chris@26 200
Chris@43 201 if ((m_frameCount == 0) && (index == 0)) // first element
Chris@45 202 setValue(0, 0, AdvanceNone, 0, dMN);
Chris@43 203 else if (m_frameCount == 0) // first row
Chris@45 204 setValue(0, index, AdvanceOther,
cannam@0 205 getValue(0, index-1, true), dMN);
cannam@0 206 else if (index == 0) // first column
Chris@45 207 setValue(m_frameCount, index, AdvanceThis,
Chris@43 208 getValue(m_frameCount - 1, 0, true), dMN);
Chris@43 209 else if (index == m_otherMatcher->m_frameCount - m_blockSize) {
cannam@0 210 // missing value(s) due to cutoff
cannam@0 211 // - no previous value in current row (resp. column)
cannam@0 212 // - no diagonal value if prev. dir. == curr. dirn
Chris@43 213 int min2 = getValue(m_frameCount - 1, index, true);
Chris@43 214 // if ((m_firstPM && (first[m_frameCount - 1] == index)) ||
Chris@43 215 // (!m_firstPM && (m_last[index-1] < m_frameCount)))
Chris@43 216 if (m_first[m_frameCount - 1] == index)
Chris@45 217 setValue(m_frameCount, index, AdvanceThis, min2, dMN);
cannam@0 218 else {
Chris@43 219 int min1 = getValue(m_frameCount - 1, index - 1, true);
cannam@0 220 if (min1 + dMN <= min2)
Chris@45 221 setValue(m_frameCount, index, AdvanceBoth, min1,dMN);
cannam@0 222 else
Chris@45 223 setValue(m_frameCount, index, AdvanceThis, min2,dMN);
cannam@0 224 }
cannam@0 225 } else {
Chris@43 226 int min1 = getValue(m_frameCount, index-1, true);
Chris@43 227 int min2 = getValue(m_frameCount - 1, index, true);
Chris@43 228 int min3 = getValue(m_frameCount - 1, index-1, true);
cannam@0 229 if (min1 <= min2) {
cannam@0 230 if (min3 + dMN <= min1)
Chris@45 231 setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
cannam@0 232 else
Chris@45 233 setValue(m_frameCount, index, AdvanceOther,min1,dMN);
cannam@0 234 } else {
cannam@0 235 if (min3 + dMN <= min2)
Chris@45 236 setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
cannam@0 237 else
Chris@45 238 setValue(m_frameCount, index, AdvanceThis, min2,dMN);
cannam@0 239 }
cannam@0 240 }
Chris@43 241 m_otherMatcher->m_last[index]++;
cannam@0 242 } // loop for row (resp. column)
cannam@0 243
Chris@43 244 m_frameCount++;
Chris@43 245 m_runCount++;
cannam@0 246
Chris@43 247 m_otherMatcher->m_runCount = 0;
cannam@0 248
Chris@43 249 if (overflow) {
cannam@0 250 cerr << "WARNING: overflow in distance metric: "
Chris@43 251 << "frame " << m_frameCount << ", val = " << mx << endl;
Chris@43 252 }
Chris@21 253 }
cannam@0 254
cannam@0 255 int
cannam@0 256 Matcher::getValue(int i, int j, bool firstAttempt)
cannam@0 257 {
Chris@43 258 if (m_firstPM)
Chris@43 259 return m_bestPathCost[i][j - m_first[i]];
cannam@0 260 else
Chris@43 261 return m_otherMatcher->m_bestPathCost[j][i - m_otherMatcher->m_first[j]];
cannam@0 262 } // getValue()
cannam@0 263
cannam@0 264 void
Chris@45 265 Matcher::setValue(int i, int j, Advance dir, float value, float dMN)
cannam@0 266 {
Chris@43 267 if (m_firstPM) {
Chris@45 268
Chris@45 269 int jdx = j - m_first[i];
Chris@45 270 m_distance[i][jdx] = dMN;
Chris@45 271 m_advance[i][jdx] = dir;
Chris@45 272 m_bestPathCost[i][jdx] =
Chris@45 273 (value + (dir == AdvanceBoth ? dMN*2: dMN));
Chris@45 274
cannam@0 275 } else {
Chris@45 276
Chris@45 277 if (dir == AdvanceThis) {
Chris@45 278 dir = AdvanceOther;
Chris@45 279 } else if (dir == AdvanceOther) {
Chris@45 280 dir = AdvanceThis;
Chris@45 281 }
Chris@45 282
Chris@43 283 int idx = i - m_otherMatcher->m_first[j];
Chris@45 284
Chris@43 285 if (idx == (int)m_otherMatcher->m_distYSizes[j]) {
cannam@0 286 // This should never happen, but if we allow arbitrary
cannam@0 287 // pauses in either direction, and arbitrary lengths at
cannam@0 288 // end, it is better than a segmentation fault.
cannam@0 289 std::cerr << "Emergency resize: " << idx << " -> " << idx * 2 << std::endl;
Chris@43 290 m_otherMatcher->m_distYSizes[j] = idx * 2;
Chris@43 291 m_otherMatcher->m_bestPathCost[j].resize(idx * 2, 0);
Chris@43 292 m_otherMatcher->m_distance[j].resize(idx * 2, 0);
cannam@0 293 }
Chris@45 294
Chris@45 295 m_otherMatcher->m_distance[j][idx] = dMN;
Chris@45 296 m_otherMatcher->m_advance[j][idx] = dir;
Chris@43 297 m_otherMatcher->m_bestPathCost[j][idx] =
Chris@45 298 (value + (dir == AdvanceBoth ? dMN*2: dMN));
cannam@0 299 }
cannam@0 300 } // setValue()
cannam@0 301