Mercurial > hg > match-vamp
view src/Matcher.cpp @ 53:331a17753663 refactors
If the distance metric is a float, the total path cost should be a double (otherwise discriminatory precision is lost as the overall total accumulates)
author | Chris Cannam |
---|---|
date | Fri, 14 Nov 2014 10:09:10 +0000 |
parents | 8cbc15519d2c |
children | 30567d4fb83a 696f6e7f2f31 |
line wrap: on
line source
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */ /* Vamp feature extraction plugin using the MATCH audio alignment algorithm. Centre for Digital Music, Queen Mary, University of London. This file copyright 2007 Simon Dixon, Chris Cannam and QMUL. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. See the file COPYING included with this distribution for more information. */ #include "Matcher.h" #include <iostream> #include <cstdlib> #include <cassert> //#define DEBUG_MATCHER 1 Matcher::Matcher(Parameters parameters, FeatureExtractor::Parameters feParams, Matcher *p) : m_params(parameters), m_featureExtractor(feParams), m_metric(parameters.distanceNorm) { #ifdef DEBUG_MATCHER cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ")" << endl; #endif m_otherMatcher = p; // the first matcher will need this to be set later m_firstPM = (!p); m_frameCount = 0; m_runCount = 0; m_featureSize = m_featureExtractor.getFeatureSize(); m_blockSize = 0; m_blockSize = lrint(m_params.blockTime / m_params.hopTime); #ifdef DEBUG_MATCHER cerr << "Matcher: m_blockSize = " << m_blockSize << endl; #endif m_initialised = false; } Matcher::Matcher(Parameters parameters, Matcher *p, int m_featureSize_) : m_params(parameters), m_featureSize(m_featureSize_), m_featureExtractor(FeatureExtractor::Parameters(m_params.sampleRate, m_params.fftSize)), // unused default config m_metric(parameters.distanceNorm) { #ifdef DEBUG_MATCHER cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ", " << m_featureSize << ")" << endl; #endif m_otherMatcher = p; // the first matcher will need this to be set later m_firstPM = (!p); m_frameCount = 0; m_runCount = 0; m_blockSize = 0; m_blockSize = lrint(m_params.blockTime / m_params.hopTime); #ifdef DEBUG_MATCHER cerr << "Matcher: m_blockSize = " << m_blockSize << endl; #endif m_initialised = false; } Matcher::~Matcher() { #ifdef DEBUG_MATCHER cerr << "Matcher(" << this << ")::~Matcher()" << endl; #endif } void Matcher::init() { if (m_initialised) return; m_frames = vector<vector<double> > (m_blockSize, vector<double>(m_featureSize, 0)); m_distXSize = m_blockSize * 2; size(); m_frameCount = 0; m_runCount = 0; m_initialised = true; } void Matcher::size() { int distSize = (m_params.maxRunCount + 1) * m_blockSize; m_bestPathCost.resize(m_distXSize, vector<double>(distSize, 0)); m_distance.resize(m_distXSize, vector<float>(distSize, 0)); m_advance.resize(m_distXSize, vector<Advance>(distSize, AdvanceNone)); m_distYSizes.resize(m_distXSize, distSize); m_first.resize(m_distXSize, 0); m_last.resize(m_distXSize, 0); } vector<double> Matcher::consumeFrame(double *reBuffer, double *imBuffer) { if (!m_initialised) init(); vector<double> real(reBuffer, reBuffer + m_params.fftSize/2 + 1); vector<double> imag(imBuffer, imBuffer + m_params.fftSize/2 + 1); vector<double> feature = m_featureExtractor.process(real, imag); int frameIndex = m_frameCount % m_blockSize; m_frames[frameIndex] = feature; calcAdvance(); return feature; } void Matcher::consumeFeatureVector(std::vector<double> feature) { if (!m_initialised) init(); int frameIndex = m_frameCount % m_blockSize; m_frames[frameIndex] = feature; calcAdvance(); } void Matcher::calcAdvance() { int frameIndex = m_frameCount % m_blockSize; if (m_frameCount >= m_distXSize) { m_distXSize *= 2; size(); } if (m_firstPM && (m_frameCount >= m_blockSize)) { int len = m_last[m_frameCount - m_blockSize] - m_first[m_frameCount - m_blockSize]; // We need to copy distance[m_frameCount-m_blockSize] to // distance[m_frameCount], and then truncate // distance[m_frameCount-m_blockSize] to its first len elements. // Same for bestPathCost. /* std::cerr << "Matcher(" << this << "): moving " << distYSizes[m_frameCount - m_blockSize] << " from " << m_frameCount - m_blockSize << " to " << m_frameCount << ", allocating " << len << " for " << m_frameCount - m_blockSize << std::endl; */ m_distance[m_frameCount] = m_distance[m_frameCount - m_blockSize]; m_distance[m_frameCount - m_blockSize].resize(len, 0); m_bestPathCost[m_frameCount] = m_bestPathCost[m_frameCount - m_blockSize]; m_bestPathCost[m_frameCount - m_blockSize].resize(len, 0); m_advance[m_frameCount] = m_advance[m_frameCount - m_blockSize]; m_advance[m_frameCount - m_blockSize].resize(len, AdvanceNone); m_distYSizes[m_frameCount] = m_distYSizes[m_frameCount - m_blockSize]; m_distYSizes[m_frameCount - m_blockSize] = len; } int stop = m_otherMatcher->m_frameCount; int index = stop - m_blockSize; if (index < 0) index = 0; m_first[m_frameCount] = index; m_last[m_frameCount] = stop; float mn= -1; float mx= -1; for ( ; index < stop; index++) { float dMN = (float) m_metric.calcDistance (m_frames[frameIndex], m_otherMatcher->m_frames[index % m_blockSize]); if (mx<0) mx = mn = dMN; else if (dMN > mx) mx = dMN; else if (dMN < mn) mn = dMN; if ((m_frameCount == 0) && (index == 0)) // first element setValue(0, 0, AdvanceNone, 0, dMN); else if (m_frameCount == 0) // first row setValue(0, index, AdvanceOther, getValue(0, index-1, true), dMN); else if (index == 0) // first column setValue(m_frameCount, index, AdvanceThis, getValue(m_frameCount - 1, 0, true), dMN); else if (index == m_otherMatcher->m_frameCount - m_blockSize) { // missing value(s) due to cutoff // - no previous value in current row (resp. column) // - no diagonal value if prev. dir. == curr. dirn double min2 = getValue(m_frameCount - 1, index, true); // if ((m_firstPM && (first[m_frameCount - 1] == index)) || // (!m_firstPM && (m_last[index-1] < m_frameCount))) if (m_first[m_frameCount - 1] == index) setValue(m_frameCount, index, AdvanceThis, min2, dMN); else { double min1 = getValue(m_frameCount - 1, index - 1, true); if (min1 + dMN <= min2) setValue(m_frameCount, index, AdvanceBoth, min1,dMN); else setValue(m_frameCount, index, AdvanceThis, min2,dMN); } } else { double min1 = getValue(m_frameCount, index-1, true); double min2 = getValue(m_frameCount - 1, index, true); double min3 = getValue(m_frameCount - 1, index-1, true); if (min1 <= min2) { if (min3 + dMN <= min1) setValue(m_frameCount, index, AdvanceBoth, min3,dMN); else setValue(m_frameCount, index, AdvanceOther,min1,dMN); } else { if (min3 + dMN <= min2) setValue(m_frameCount, index, AdvanceBoth, min3,dMN); else setValue(m_frameCount, index, AdvanceThis, min2,dMN); } } m_otherMatcher->m_last[index]++; } // loop for row (resp. column) m_frameCount++; m_runCount++; m_otherMatcher->m_runCount = 0; } double Matcher::getValue(int i, int j, bool firstAttempt) { if (m_firstPM) return m_bestPathCost[i][j - m_first[i]]; else return m_otherMatcher->m_bestPathCost[j][i - m_otherMatcher->m_first[j]]; } // getValue() void Matcher::setValue(int i, int j, Advance dir, double value, float dMN) { if (m_firstPM) { int jdx = j - m_first[i]; m_distance[i][jdx] = dMN; m_advance[i][jdx] = dir; m_bestPathCost[i][jdx] = (value + (dir == AdvanceBoth ? dMN*2: dMN)); } else { if (dir == AdvanceThis) { dir = AdvanceOther; } else if (dir == AdvanceOther) { dir = AdvanceThis; } int idx = i - m_otherMatcher->m_first[j]; if (idx == (int)m_otherMatcher->m_distYSizes[j]) { // This should never happen, but if we allow arbitrary // pauses in either direction, and arbitrary lengths at // end, it is better than a segmentation fault. std::cerr << "Emergency resize: " << idx << " -> " << idx * 2 << std::endl; m_otherMatcher->m_distYSizes[j] = idx * 2; m_otherMatcher->m_bestPathCost[j].resize(idx * 2, 0); m_otherMatcher->m_distance[j].resize(idx * 2, 0); m_otherMatcher->m_advance[j].resize(idx * 2, AdvanceNone); } m_otherMatcher->m_distance[j][idx] = dMN; m_otherMatcher->m_advance[j][idx] = dir; m_otherMatcher->m_bestPathCost[j][idx] = (value + (dir == AdvanceBoth ? dMN*2: dMN)); } } // setValue()