Mercurial > hg > pyin
view MonoNote.cpp @ 146:8404827a4b02 memory
Avoid calculating a temporary obsprob matrix for note tracking; + some tidying
author | Chris Cannam |
---|---|
date | Wed, 17 May 2017 14:50:10 +0100 |
parents | 83978b93aac1 |
children | 729cc1da9b8d |
line wrap: on
line source
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */ /* pYIN - A fundamental frequency estimator for monophonic audio Centre for Digital Music, Queen Mary, University of London. This program is free software; you can redistribute it and/or modify it under the terms of the GNU General Public License as published by the Free Software Foundation; either version 2 of the License, or (at your option) any later version. See the file COPYING included with this distribution for more information. */ #include "MonoNote.h" #include <vector> #include <cstdio> #include <cmath> #include <complex> using std::vector; using std::pair; MonoNote::MonoNote() : hmm(0) { } MonoNote::~MonoNote() { } const vector<MonoNote::FrameOutput> MonoNote::process(const vector<vector<pair<double, double> > > pitchProb) { // Previously, this built up a single matrix of probabilities, by // calling calculateObsProb to get a column for each frame in // pitchProb. // // The number of distinct states depends on MonoNoteParameters, // but the defaults have 3 states per pitch, 3 pitches per MIDI // note, and 69 MIDI notes, giving 681 states per frame. With a // frame step size of 256 at 44100Hz sample rate, a 3-minute song // has about 30K frames leading to a 20 million element // probability matrix. // // Since the matrix is very sparse, we can avoid some of this by // feeding the (sparse implementation of) HMM one column at a // time. vector<int> path; if (!pitchProb.empty()) { hmm.initialise(hmm.calculateObsProb(pitchProb[0])); for (size_t iFrame = 1; iFrame < pitchProb.size(); ++iFrame) { hmm.process(hmm.calculateObsProb(pitchProb[iFrame])); } path = hmm.track(); } vector<MonoNote::FrameOutput> out; for (size_t iFrame = 0; iFrame < path.size(); ++iFrame) { double currPitch = -1; int stateKind = 0; currPitch = hmm.par.minPitch + (path[iFrame]/hmm.par.nSPP) * 1.0/hmm.par.nPPS; stateKind = (path[iFrame]) % hmm.par.nSPP + 1; out.push_back(FrameOutput(iFrame, currPitch, stateKind)); } return(out); }