view src/Matcher.cpp @ 46:b0ebc3e2c016 refactors

Some fixes: int -> float
author Chris Cannam
date Thu, 13 Nov 2014 15:09:04 +0000
parents a1b7df871496
children 8cbc15519d2c
line wrap: on
line source
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*-  vi:set ts=8 sts=4 sw=4: */

/*
    Vamp feature extraction plugin using the MATCH audio alignment
    algorithm.

    Centre for Digital Music, Queen Mary, University of London.
    This file copyright 2007 Simon Dixon, Chris Cannam and QMUL.
    
    This program is free software; you can redistribute it and/or
    modify it under the terms of the GNU General Public License as
    published by the Free Software Foundation; either version 2 of the
    License, or (at your option) any later version.  See the file
    COPYING included with this distribution for more information.
*/

#include "Matcher.h"

#include <iostream>

#include <cstdlib>
#include <cassert>

//#define DEBUG_MATCHER 1

Matcher::Matcher(Parameters parameters,
                 FeatureExtractor::Parameters feParams,
                 Matcher *p) :
    m_params(parameters),
    m_featureExtractor(feParams),
    m_metric(parameters.distanceNorm)
{
#ifdef DEBUG_MATCHER
    cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ")" << endl;
#endif

    m_otherMatcher = p;	// the first matcher will need this to be set later
    m_firstPM = (!p);
    m_frameCount = 0;
    m_runCount = 0;
    m_featureSize = m_featureExtractor.getFeatureSize();
    m_blockSize = 0;

    m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
#ifdef DEBUG_MATCHER
    cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
#endif

    m_initialised = false;
}

Matcher::Matcher(Parameters parameters, Matcher *p, int m_featureSize_) :
    m_params(parameters),
    m_featureSize(m_featureSize_),
    m_featureExtractor(FeatureExtractor::Parameters(m_params.sampleRate, m_params.fftSize)), // unused default config
    m_metric(parameters.distanceNorm)
{
#ifdef DEBUG_MATCHER
    cerr << "Matcher::Matcher(" << m_params.sampleRate << ", " << p << ", " << m_featureSize << ")" << endl;
#endif

    m_otherMatcher = p;	// the first matcher will need this to be set later
    m_firstPM = (!p);
    m_frameCount = 0;
    m_runCount = 0;
    m_blockSize = 0;

    m_blockSize = lrint(m_params.blockTime / m_params.hopTime);
#ifdef DEBUG_MATCHER
    cerr << "Matcher: m_blockSize = " << m_blockSize << endl;
#endif

    m_initialised = false;
} 

Matcher::~Matcher()
{
#ifdef DEBUG_MATCHER
    cerr << "Matcher(" << this << ")::~Matcher()" << endl;
#endif
}

void
Matcher::init()
{
    if (m_initialised) return;

    m_frames = vector<vector<double> >
        (m_blockSize, vector<double>(m_featureSize, 0));

    m_distXSize = m_blockSize * 2;

    size();

    m_frameCount = 0;
    m_runCount = 0;
    
    m_initialised = true;
}

void
Matcher::size()
{
    int distSize = (m_params.maxRunCount + 1) * m_blockSize;
    m_bestPathCost.resize(m_distXSize, vector<float>(distSize, 0));
    m_distance.resize(m_distXSize, vector<float>(distSize, 0));
    m_advance.resize(m_distXSize, vector<Advance>(distSize, AdvanceNone));
    m_distYSizes.resize(m_distXSize, distSize);
    m_first.resize(m_distXSize, 0);
    m_last.resize(m_distXSize, 0);
}

vector<double>
Matcher::consumeFrame(double *reBuffer, double *imBuffer)
{
    if (!m_initialised) init();

    vector<double> real(reBuffer, reBuffer + m_params.fftSize/2 + 1);
    vector<double> imag(imBuffer, imBuffer + m_params.fftSize/2 + 1);
    vector<double> feature = m_featureExtractor.process(real, imag);
    int frameIndex = m_frameCount % m_blockSize;
    m_frames[frameIndex] = feature;
    calcAdvance();

    return feature;
}

void
Matcher::consumeFeatureVector(std::vector<double> feature)
{
    if (!m_initialised) init();
    int frameIndex = m_frameCount % m_blockSize; 
    m_frames[frameIndex] = feature;
    calcAdvance();
}

void
Matcher::calcAdvance()
{
    int frameIndex = m_frameCount % m_blockSize;

    if (m_frameCount >= m_distXSize) {
        m_distXSize *= 2;
        size();
    }

    if (m_firstPM && (m_frameCount >= m_blockSize)) {

        int len = m_last[m_frameCount - m_blockSize] -
                 m_first[m_frameCount - m_blockSize];

        // We need to copy distance[m_frameCount-m_blockSize] to
        // distance[m_frameCount], and then truncate
        // distance[m_frameCount-m_blockSize] to its first len elements.
        // Same for bestPathCost.
/*
        std::cerr << "Matcher(" << this << "): moving " << distYSizes[m_frameCount - m_blockSize] << " from " << m_frameCount - m_blockSize << " to "
                  << m_frameCount << ", allocating " << len << " for "
                  << m_frameCount - m_blockSize << std::endl;
*/
        m_distance[m_frameCount] = m_distance[m_frameCount - m_blockSize];
        m_distance[m_frameCount - m_blockSize].resize(len, 0);

        m_bestPathCost[m_frameCount] = m_bestPathCost[m_frameCount - m_blockSize];
        m_bestPathCost[m_frameCount - m_blockSize].resize(len, 0);

        m_advance[m_frameCount] = m_advance[m_frameCount - m_blockSize];
        m_advance[m_frameCount - m_blockSize].resize(len, AdvanceNone);
        
        m_distYSizes[m_frameCount] = m_distYSizes[m_frameCount - m_blockSize];
        m_distYSizes[m_frameCount - m_blockSize] = len;
    }

    int stop = m_otherMatcher->m_frameCount;
    int index = stop - m_blockSize;
    if (index < 0)
        index = 0;
    m_first[m_frameCount] = index;
    m_last[m_frameCount] = stop;

    float mn= -1;
    float mx= -1;
    for ( ; index < stop; index++) {

        float dMN = m_metric.calcDistance
            (m_frames[frameIndex],
             m_otherMatcher->m_frames[index % m_blockSize]);
        
        if (mx<0)
            mx = mn = dMN;
        else if (dMN > mx)
            mx = dMN;
        else if (dMN < mn)
            mn = dMN;

        if ((m_frameCount == 0) && (index == 0))    // first element
            setValue(0, 0, AdvanceNone, 0, dMN);
        else if (m_frameCount == 0)                 // first row
            setValue(0, index, AdvanceOther,
                     getValue(0, index-1, true), dMN);
        else if (index == 0)                      // first column
            setValue(m_frameCount, index, AdvanceThis,
                     getValue(m_frameCount - 1, 0, true), dMN);
        else if (index == m_otherMatcher->m_frameCount - m_blockSize) {
            // missing value(s) due to cutoff
            //  - no previous value in current row (resp. column)
            //  - no diagonal value if prev. dir. == curr. dirn
            float min2 = getValue(m_frameCount - 1, index, true);
            //	if ((m_firstPM && (first[m_frameCount - 1] == index)) ||
            //			(!m_firstPM && (m_last[index-1] < m_frameCount)))
            if (m_first[m_frameCount - 1] == index)
                setValue(m_frameCount, index, AdvanceThis, min2, dMN);
            else {
                float min1 = getValue(m_frameCount - 1, index - 1, true);
                if (min1 + dMN <= min2)
                    setValue(m_frameCount, index, AdvanceBoth, min1,dMN);
                else
                    setValue(m_frameCount, index, AdvanceThis, min2,dMN);
            }
        } else {
            float min1 = getValue(m_frameCount, index-1, true);
            float min2 = getValue(m_frameCount - 1, index, true);
            float min3 = getValue(m_frameCount - 1, index-1, true);
            if (min1 <= min2) {
                if (min3 + dMN <= min1)
                    setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
                else
                    setValue(m_frameCount, index, AdvanceOther,min1,dMN);
            } else {
                if (min3 + dMN <= min2)
                    setValue(m_frameCount, index, AdvanceBoth, min3,dMN);
                else
                    setValue(m_frameCount, index, AdvanceThis, min2,dMN);
            }
        }
        m_otherMatcher->m_last[index]++;
    } // loop for row (resp. column)

    m_frameCount++;
    m_runCount++;

    m_otherMatcher->m_runCount = 0;
}

float
Matcher::getValue(int i, int j, bool firstAttempt)
{
    if (m_firstPM)
        return m_bestPathCost[i][j - m_first[i]];
    else
        return m_otherMatcher->m_bestPathCost[j][i - m_otherMatcher->m_first[j]];
} // getValue()

void
Matcher::setValue(int i, int j, Advance dir, float value, float dMN)
{
    if (m_firstPM) {

        int jdx = j - m_first[i];
        m_distance[i][jdx] = dMN;
        m_advance[i][jdx] = dir;
        m_bestPathCost[i][jdx] =
            (value + (dir == AdvanceBoth ? dMN*2: dMN));

    } else {

        if (dir == AdvanceThis) {
            dir = AdvanceOther;
        } else if (dir == AdvanceOther) {
            dir = AdvanceThis;
        }

        int idx = i - m_otherMatcher->m_first[j];
        
        if (idx == (int)m_otherMatcher->m_distYSizes[j]) {
            // This should never happen, but if we allow arbitrary
            // pauses in either direction, and arbitrary lengths at
            // end, it is better than a segmentation fault.
            std::cerr << "Emergency resize: " << idx << " -> " << idx * 2 << std::endl;
            m_otherMatcher->m_distYSizes[j] = idx * 2;
            m_otherMatcher->m_bestPathCost[j].resize(idx * 2, 0);
            m_otherMatcher->m_distance[j].resize(idx * 2, 0);
            m_otherMatcher->m_advance[j].resize(idx * 2, AdvanceNone);
        }

        m_otherMatcher->m_distance[j][idx] = dMN;
        m_otherMatcher->m_advance[j][idx] = dir;
        m_otherMatcher->m_bestPathCost[j][idx] =
            (value + (dir == AdvanceBoth ? dMN*2: dMN));
    }
} // setValue()