annotate CepstrumPitchTracker.cpp @ 25:9aee1a0e6223

Simplify confidence metric
author Chris Cannam
date Tue, 10 Jul 2012 22:16:00 +0100
parents 0c45cca1e4fd
children 13568f1ccff0
rev   line source
Chris@3 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@3 2 /*
Chris@3 3 Permission is hereby granted, free of charge, to any person
Chris@3 4 obtaining a copy of this software and associated documentation
Chris@3 5 files (the "Software"), to deal in the Software without
Chris@3 6 restriction, including without limitation the rights to use, copy,
Chris@3 7 modify, merge, publish, distribute, sublicense, and/or sell copies
Chris@3 8 of the Software, and to permit persons to whom the Software is
Chris@3 9 furnished to do so, subject to the following conditions:
Chris@3 10
Chris@3 11 The above copyright notice and this permission notice shall be
Chris@3 12 included in all copies or substantial portions of the Software.
Chris@3 13
Chris@3 14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
Chris@3 15 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
Chris@3 16 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
Chris@3 17 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
Chris@3 18 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
Chris@3 19 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
Chris@3 20 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Chris@3 21 */
Chris@3 22
Chris@3 23 #include "CepstrumPitchTracker.h"
Chris@3 24
Chris@3 25 #include <vector>
Chris@3 26 #include <algorithm>
Chris@3 27
Chris@3 28 #include <cstdio>
Chris@3 29 #include <cmath>
Chris@3 30 #include <complex>
Chris@3 31
Chris@3 32 using std::string;
Chris@7 33 using std::vector;
Chris@16 34 using Vamp::RealTime;
Chris@7 35
Chris@8 36 CepstrumPitchTracker::Hypothesis::Hypothesis()
Chris@7 37 {
Chris@8 38 m_state = New;
Chris@7 39 m_age = 0;
Chris@7 40 }
Chris@7 41
Chris@11 42 CepstrumPitchTracker::Hypothesis::~Hypothesis()
Chris@11 43 {
Chris@11 44 }
Chris@11 45
Chris@7 46 bool
Chris@7 47 CepstrumPitchTracker::Hypothesis::isWithinTolerance(Estimate s)
Chris@7 48 {
Chris@7 49 if (m_pending.empty()) {
Chris@7 50 return true;
Chris@7 51 }
Chris@16 52
Chris@16 53 // check we are within a relatively close tolerance of the last
Chris@16 54 // candidate
Chris@17 55 Estimate last = m_pending[m_pending.size()-1];
Chris@7 56 double r = s.freq / last.freq;
Chris@7 57 int cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@17 58 if (cents < -60 || cents > 60) return false;
Chris@16 59
Chris@17 60 // and within a slightly bigger tolerance of the current mean
Chris@17 61 double meanFreq = getMeanFrequency();
Chris@17 62 r = s.freq / meanFreq;
Chris@16 63 cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@16 64 if (cents < -80 || cents > 80) return false;
Chris@16 65
Chris@16 66 return true;
Chris@7 67 }
Chris@7 68
Chris@7 69 bool
Chris@7 70 CepstrumPitchTracker::Hypothesis::isSatisfied()
Chris@7 71 {
Chris@15 72 if (m_pending.empty()) return false;
Chris@15 73
Chris@15 74 double meanConfidence = 0.0;
Chris@15 75 for (int i = 0; i < m_pending.size(); ++i) {
Chris@15 76 meanConfidence += m_pending[i].confidence;
Chris@15 77 }
Chris@15 78 meanConfidence /= m_pending.size();
Chris@15 79
Chris@25 80 int lengthRequired = 10000;
Chris@25 81 if (meanConfidence > 0.0) {
Chris@25 82 lengthRequired = int(2.0 / meanConfidence + 0.5);
Chris@25 83 }
Chris@15 84 std::cerr << "meanConfidence = " << meanConfidence << ", lengthRequired = " << lengthRequired << ", length = " << m_pending.size() << std::endl;
Chris@15 85
Chris@15 86 return (m_pending.size() > lengthRequired);
Chris@7 87 }
Chris@7 88
Chris@8 89 void
Chris@8 90 CepstrumPitchTracker::Hypothesis::advanceTime()
Chris@8 91 {
Chris@8 92 ++m_age;
Chris@8 93 }
Chris@8 94
Chris@7 95 bool
Chris@7 96 CepstrumPitchTracker::Hypothesis::test(Estimate s)
Chris@7 97 {
Chris@8 98 bool accept = false;
Chris@8 99
Chris@8 100 switch (m_state) {
Chris@8 101
Chris@8 102 case New:
Chris@8 103 m_state = Provisional;
Chris@8 104 accept = true;
Chris@8 105 break;
Chris@8 106
Chris@8 107 case Provisional:
Chris@8 108 if (m_age > 3) {
Chris@8 109 m_state = Rejected;
Chris@8 110 } else if (isWithinTolerance(s)) {
Chris@8 111 accept = true;
Chris@8 112 }
Chris@8 113 break;
Chris@8 114
Chris@8 115 case Satisfied:
Chris@8 116 if (m_age > 3) {
Chris@8 117 m_state = Expired;
Chris@8 118 } else if (isWithinTolerance(s)) {
Chris@8 119 accept = true;
Chris@8 120 }
Chris@8 121 break;
Chris@8 122
Chris@8 123 case Rejected:
Chris@8 124 break;
Chris@8 125
Chris@8 126 case Expired:
Chris@8 127 break;
Chris@7 128 }
Chris@7 129
Chris@8 130 if (accept) {
Chris@8 131 m_pending.push_back(s);
Chris@8 132 m_age = 0;
Chris@8 133 if (m_state == Provisional && isSatisfied()) {
Chris@8 134 m_state = Satisfied;
Chris@7 135 }
Chris@7 136 }
Chris@7 137
Chris@14 138 return accept && (m_state == Satisfied);
Chris@8 139 }
Chris@7 140
Chris@7 141 CepstrumPitchTracker::Hypothesis::State
Chris@7 142 CepstrumPitchTracker::Hypothesis::getState()
Chris@7 143 {
Chris@7 144 return m_state;
Chris@7 145 }
Chris@7 146
Chris@12 147 int
Chris@12 148 CepstrumPitchTracker::Hypothesis::getPendingLength()
Chris@12 149 {
Chris@12 150 return m_pending.size();
Chris@12 151 }
Chris@12 152
Chris@7 153 CepstrumPitchTracker::Hypothesis::Estimates
Chris@7 154 CepstrumPitchTracker::Hypothesis::getAcceptedEstimates()
Chris@7 155 {
Chris@7 156 if (m_state == Satisfied || m_state == Expired) {
Chris@7 157 return m_pending;
Chris@7 158 } else {
Chris@7 159 return Estimates();
Chris@7 160 }
Chris@7 161 }
Chris@7 162
Chris@17 163 double
Chris@17 164 CepstrumPitchTracker::Hypothesis::getMeanFrequency()
Chris@17 165 {
Chris@17 166 double acc = 0.0;
Chris@17 167 for (int i = 0; i < m_pending.size(); ++i) {
Chris@17 168 acc += m_pending[i].freq;
Chris@17 169 }
Chris@17 170 acc /= m_pending.size();
Chris@17 171 return acc;
Chris@17 172 }
Chris@17 173
Chris@16 174 CepstrumPitchTracker::Hypothesis::Note
Chris@16 175 CepstrumPitchTracker::Hypothesis::getAveragedNote()
Chris@16 176 {
Chris@16 177 Note n;
Chris@16 178
Chris@16 179 if (!(m_state == Satisfied || m_state == Expired)) {
Chris@16 180 n.freq = 0.0;
Chris@16 181 n.time = RealTime::zeroTime;
Chris@16 182 n.duration = RealTime::zeroTime;
Chris@16 183 return n;
Chris@16 184 }
Chris@16 185
Chris@16 186 n.time = m_pending.begin()->time;
Chris@16 187
Chris@16 188 Estimates::iterator i = m_pending.end();
Chris@16 189 --i;
Chris@16 190 n.duration = i->time - n.time;
Chris@16 191
Chris@17 192 // just mean frequency for now, but this isn't at all right perceptually
Chris@17 193 n.freq = getMeanFrequency();
Chris@16 194
Chris@16 195 return n;
Chris@16 196 }
Chris@16 197
Chris@11 198 void
Chris@16 199 CepstrumPitchTracker::Hypothesis::addFeatures(FeatureSet &fs)
Chris@11 200 {
Chris@11 201 for (int i = 0; i < m_pending.size(); ++i) {
Chris@11 202 Feature f;
Chris@11 203 f.hasTimestamp = true;
Chris@11 204 f.timestamp = m_pending[i].time;
Chris@11 205 f.values.push_back(m_pending[i].freq);
Chris@16 206 fs[0].push_back(f);
Chris@11 207 }
Chris@16 208
Chris@16 209 Feature nf;
Chris@16 210 nf.hasTimestamp = true;
Chris@16 211 nf.hasDuration = true;
Chris@16 212 Note n = getAveragedNote();
Chris@16 213 nf.timestamp = n.time;
Chris@16 214 nf.duration = n.duration;
Chris@16 215 nf.values.push_back(n.freq);
Chris@16 216 fs[1].push_back(nf);
Chris@11 217 }
Chris@3 218
Chris@3 219 CepstrumPitchTracker::CepstrumPitchTracker(float inputSampleRate) :
Chris@3 220 Plugin(inputSampleRate),
Chris@3 221 m_channels(0),
Chris@3 222 m_stepSize(256),
Chris@3 223 m_blockSize(1024),
Chris@3 224 m_fmin(50),
Chris@25 225 m_fmax(900),
Chris@18 226 m_vflen(1),
Chris@3 227 m_binFrom(0),
Chris@3 228 m_binTo(0),
Chris@15 229 m_bins(0)
Chris@3 230 {
Chris@3 231 }
Chris@3 232
Chris@3 233 CepstrumPitchTracker::~CepstrumPitchTracker()
Chris@3 234 {
Chris@3 235 }
Chris@3 236
Chris@3 237 string
Chris@3 238 CepstrumPitchTracker::getIdentifier() const
Chris@3 239 {
Chris@3 240 return "cepstrum-pitch";
Chris@3 241 }
Chris@3 242
Chris@3 243 string
Chris@3 244 CepstrumPitchTracker::getName() const
Chris@3 245 {
Chris@3 246 return "Cepstrum Pitch Tracker";
Chris@3 247 }
Chris@3 248
Chris@3 249 string
Chris@3 250 CepstrumPitchTracker::getDescription() const
Chris@3 251 {
Chris@3 252 return "Estimate f0 of monophonic material using a cepstrum method.";
Chris@3 253 }
Chris@3 254
Chris@3 255 string
Chris@3 256 CepstrumPitchTracker::getMaker() const
Chris@3 257 {
Chris@3 258 return "Chris Cannam";
Chris@3 259 }
Chris@3 260
Chris@3 261 int
Chris@3 262 CepstrumPitchTracker::getPluginVersion() const
Chris@3 263 {
Chris@3 264 // Increment this each time you release a version that behaves
Chris@3 265 // differently from the previous one
Chris@3 266 return 1;
Chris@3 267 }
Chris@3 268
Chris@3 269 string
Chris@3 270 CepstrumPitchTracker::getCopyright() const
Chris@3 271 {
Chris@3 272 return "Freely redistributable (BSD license)";
Chris@3 273 }
Chris@3 274
Chris@3 275 CepstrumPitchTracker::InputDomain
Chris@3 276 CepstrumPitchTracker::getInputDomain() const
Chris@3 277 {
Chris@3 278 return FrequencyDomain;
Chris@3 279 }
Chris@3 280
Chris@3 281 size_t
Chris@3 282 CepstrumPitchTracker::getPreferredBlockSize() const
Chris@3 283 {
Chris@3 284 return 1024;
Chris@3 285 }
Chris@3 286
Chris@3 287 size_t
Chris@3 288 CepstrumPitchTracker::getPreferredStepSize() const
Chris@3 289 {
Chris@3 290 return 256;
Chris@3 291 }
Chris@3 292
Chris@3 293 size_t
Chris@3 294 CepstrumPitchTracker::getMinChannelCount() const
Chris@3 295 {
Chris@3 296 return 1;
Chris@3 297 }
Chris@3 298
Chris@3 299 size_t
Chris@3 300 CepstrumPitchTracker::getMaxChannelCount() const
Chris@3 301 {
Chris@3 302 return 1;
Chris@3 303 }
Chris@3 304
Chris@3 305 CepstrumPitchTracker::ParameterList
Chris@3 306 CepstrumPitchTracker::getParameterDescriptors() const
Chris@3 307 {
Chris@3 308 ParameterList list;
Chris@3 309 return list;
Chris@3 310 }
Chris@3 311
Chris@3 312 float
Chris@3 313 CepstrumPitchTracker::getParameter(string identifier) const
Chris@3 314 {
Chris@3 315 return 0.f;
Chris@3 316 }
Chris@3 317
Chris@3 318 void
Chris@3 319 CepstrumPitchTracker::setParameter(string identifier, float value)
Chris@3 320 {
Chris@3 321 }
Chris@3 322
Chris@3 323 CepstrumPitchTracker::ProgramList
Chris@3 324 CepstrumPitchTracker::getPrograms() const
Chris@3 325 {
Chris@3 326 ProgramList list;
Chris@3 327 return list;
Chris@3 328 }
Chris@3 329
Chris@3 330 string
Chris@3 331 CepstrumPitchTracker::getCurrentProgram() const
Chris@3 332 {
Chris@3 333 return ""; // no programs
Chris@3 334 }
Chris@3 335
Chris@3 336 void
Chris@3 337 CepstrumPitchTracker::selectProgram(string name)
Chris@3 338 {
Chris@3 339 }
Chris@3 340
Chris@3 341 CepstrumPitchTracker::OutputList
Chris@3 342 CepstrumPitchTracker::getOutputDescriptors() const
Chris@3 343 {
Chris@3 344 OutputList outputs;
Chris@3 345
Chris@3 346 int n = 0;
Chris@3 347
Chris@3 348 OutputDescriptor d;
Chris@3 349
Chris@3 350 d.identifier = "f0";
Chris@3 351 d.name = "Estimated f0";
Chris@3 352 d.description = "Estimated fundamental frequency";
Chris@3 353 d.unit = "Hz";
Chris@3 354 d.hasFixedBinCount = true;
Chris@3 355 d.binCount = 1;
Chris@3 356 d.hasKnownExtents = true;
Chris@3 357 d.minValue = m_fmin;
Chris@3 358 d.maxValue = m_fmax;
Chris@3 359 d.isQuantized = false;
Chris@3 360 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@3 361 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@3 362 d.hasDuration = false;
Chris@3 363 outputs.push_back(d);
Chris@3 364
Chris@16 365 d.identifier = "notes";
Chris@16 366 d.name = "Notes";
Chris@16 367 d.description = "Derived fixed-pitch note frequencies";
Chris@16 368 d.unit = "Hz";
Chris@16 369 d.hasFixedBinCount = true;
Chris@16 370 d.binCount = 1;
Chris@16 371 d.hasKnownExtents = true;
Chris@16 372 d.minValue = m_fmin;
Chris@16 373 d.maxValue = m_fmax;
Chris@16 374 d.isQuantized = false;
Chris@16 375 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@16 376 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@16 377 d.hasDuration = true;
Chris@16 378 outputs.push_back(d);
Chris@16 379
Chris@3 380 return outputs;
Chris@3 381 }
Chris@3 382
Chris@3 383 bool
Chris@3 384 CepstrumPitchTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
Chris@3 385 {
Chris@3 386 if (channels < getMinChannelCount() ||
Chris@3 387 channels > getMaxChannelCount()) return false;
Chris@3 388
Chris@3 389 // std::cerr << "CepstrumPitchTracker::initialise: channels = " << channels
Chris@3 390 // << ", stepSize = " << stepSize << ", blockSize = " << blockSize
Chris@3 391 // << std::endl;
Chris@3 392
Chris@3 393 m_channels = channels;
Chris@3 394 m_stepSize = stepSize;
Chris@3 395 m_blockSize = blockSize;
Chris@3 396
Chris@3 397 m_binFrom = int(m_inputSampleRate / m_fmax);
Chris@3 398 m_binTo = int(m_inputSampleRate / m_fmin);
Chris@3 399
Chris@3 400 if (m_binTo >= (int)m_blockSize / 2) {
Chris@3 401 m_binTo = m_blockSize / 2 - 1;
Chris@3 402 }
Chris@3 403
Chris@3 404 m_bins = (m_binTo - m_binFrom) + 1;
Chris@3 405
Chris@3 406 reset();
Chris@3 407
Chris@3 408 return true;
Chris@3 409 }
Chris@3 410
Chris@3 411 void
Chris@3 412 CepstrumPitchTracker::reset()
Chris@3 413 {
Chris@3 414 }
Chris@3 415
Chris@3 416 void
Chris@15 417 CepstrumPitchTracker::filter(const double *cep, double *data)
Chris@3 418 {
Chris@3 419 for (int i = 0; i < m_bins; ++i) {
Chris@5 420 double v = 0;
Chris@5 421 int n = 0;
Chris@5 422 // average according to the vertical filter length
Chris@5 423 for (int j = -m_vflen/2; j <= m_vflen/2; ++j) {
Chris@5 424 int ix = i + m_binFrom + j;
Chris@5 425 if (ix >= 0 && ix < m_blockSize) {
Chris@5 426 v += cep[ix];
Chris@5 427 ++n;
Chris@5 428 }
Chris@5 429 }
Chris@15 430 data[i] = v / n;
Chris@3 431 }
Chris@6 432 }
Chris@6 433
Chris@18 434 double
Chris@18 435 CepstrumPitchTracker::cubicInterpolate(const double y[4], double x)
Chris@18 436 {
Chris@18 437 double a0 = y[3] - y[2] - y[0] + y[1];
Chris@18 438 double a1 = y[0] - y[1] - a0;
Chris@18 439 double a2 = y[2] - y[0];
Chris@18 440 double a3 = y[1];
Chris@18 441 return
Chris@18 442 a0 * x * x * x +
Chris@18 443 a1 * x * x +
Chris@18 444 a2 * x +
Chris@18 445 a3;
Chris@18 446 }
Chris@18 447
Chris@18 448 double
Chris@18 449 CepstrumPitchTracker::findInterpolatedPeak(const double *in, int maxbin)
Chris@18 450 {
Chris@18 451 if (maxbin < 2 || maxbin > m_bins - 3) {
Chris@18 452 return maxbin;
Chris@18 453 }
Chris@18 454
Chris@18 455 double maxval = 0.0;
Chris@18 456 double maxidx = maxbin;
Chris@18 457
Chris@18 458 const int divisions = 10;
Chris@18 459 double y[4];
Chris@18 460
Chris@18 461 y[0] = in[maxbin-1];
Chris@18 462 y[1] = in[maxbin];
Chris@18 463 y[2] = in[maxbin+1];
Chris@18 464 y[3] = in[maxbin+2];
Chris@18 465 for (int i = 0; i < divisions; ++i) {
Chris@18 466 double probe = double(i) / double(divisions);
Chris@18 467 double value = cubicInterpolate(y, probe);
Chris@18 468 if (value > maxval) {
Chris@18 469 maxval = value;
Chris@18 470 maxidx = maxbin + probe;
Chris@18 471 }
Chris@18 472 }
Chris@18 473
Chris@18 474 y[3] = y[2];
Chris@18 475 y[2] = y[1];
Chris@18 476 y[1] = y[0];
Chris@18 477 y[0] = in[maxbin-2];
Chris@18 478 for (int i = 0; i < divisions; ++i) {
Chris@18 479 double probe = double(i) / double(divisions);
Chris@18 480 double value = cubicInterpolate(y, probe);
Chris@18 481 if (value > maxval) {
Chris@18 482 maxval = value;
Chris@18 483 maxidx = maxbin - 1 + probe;
Chris@18 484 }
Chris@18 485 }
Chris@18 486
Chris@18 487 /*
Chris@18 488 std::cerr << "centre = " << maxbin << ": ["
Chris@18 489 << in[maxbin-2] << ","
Chris@18 490 << in[maxbin-1] << ","
Chris@18 491 << in[maxbin] << ","
Chris@18 492 << in[maxbin+1] << ","
Chris@18 493 << in[maxbin+2] << "] -> " << maxidx << std::endl;
Chris@18 494 */
Chris@18 495
Chris@18 496 return maxidx;
Chris@18 497 }
Chris@18 498
Chris@3 499 CepstrumPitchTracker::FeatureSet
Chris@16 500 CepstrumPitchTracker::process(const float *const *inputBuffers, RealTime timestamp)
Chris@3 501 {
Chris@3 502 FeatureSet fs;
Chris@3 503
Chris@3 504 int bs = m_blockSize;
Chris@3 505 int hs = m_blockSize/2 + 1;
Chris@3 506
Chris@3 507 double *rawcep = new double[bs];
Chris@3 508 double *io = new double[bs];
Chris@3 509 double *logmag = new double[bs];
Chris@3 510
Chris@4 511 // The "inverse symmetric" method. Seems to be the most reliable
Chris@3 512
Chris@25 513 double magmean = 0.0;
Chris@25 514
Chris@3 515 for (int i = 0; i < hs; ++i) {
Chris@3 516
Chris@3 517 double power =
Chris@3 518 inputBuffers[0][i*2 ] * inputBuffers[0][i*2 ] +
Chris@3 519 inputBuffers[0][i*2+1] * inputBuffers[0][i*2+1];
Chris@3 520 double mag = sqrt(power);
Chris@25 521
Chris@25 522 magmean += mag;
Chris@25 523
Chris@3 524 double lm = log(mag + 0.00000001);
Chris@3 525
Chris@4 526 logmag[i] = lm;
Chris@4 527 if (i > 0) logmag[bs - i] = lm;
Chris@3 528 }
Chris@3 529
Chris@25 530 magmean /= hs;
Chris@25 531 double threshold = 0.1; // for magmean
Chris@25 532
Chris@4 533 fft(bs, true, logmag, 0, rawcep, io);
Chris@3 534
Chris@3 535 delete[] logmag;
Chris@3 536 delete[] io;
Chris@3 537
Chris@3 538 int n = m_bins;
Chris@3 539 double *data = new double[n];
Chris@3 540 filter(rawcep, data);
Chris@3 541 delete[] rawcep;
Chris@3 542
Chris@3 543 double maxval = 0.0;
Chris@6 544 int maxbin = -1;
Chris@3 545
Chris@3 546 for (int i = 0; i < n; ++i) {
Chris@3 547 if (data[i] > maxval) {
Chris@3 548 maxval = data[i];
Chris@3 549 maxbin = i;
Chris@3 550 }
Chris@3 551 }
Chris@3 552
Chris@15 553 if (maxbin < 0) {
Chris@15 554 delete[] data;
Chris@15 555 return fs;
Chris@15 556 }
Chris@15 557
Chris@15 558 double nextPeakVal = 0.0;
Chris@15 559 for (int i = 1; i+1 < n; ++i) {
Chris@15 560 if (data[i] > data[i-1] &&
Chris@15 561 data[i] > data[i+1] &&
Chris@15 562 i != maxbin &&
Chris@15 563 data[i] > nextPeakVal) {
Chris@15 564 nextPeakVal = data[i];
Chris@15 565 }
Chris@15 566 }
Chris@8 567
Chris@18 568 double cimax = findInterpolatedPeak(data, maxbin);
Chris@18 569 double peakfreq = m_inputSampleRate / (cimax + m_binFrom);
Chris@15 570
Chris@15 571 double confidence = 0.0;
Chris@15 572 if (nextPeakVal != 0.0) {
Chris@25 573 confidence = (maxval - nextPeakVal) / 100.0;
Chris@25 574 if (magmean < threshold) confidence = 0.0;
Chris@25 575 std::cerr << "magmean = " << magmean << ", confidence = " << confidence << std::endl;
Chris@15 576 }
Chris@15 577
Chris@8 578 Hypothesis::Estimate e;
Chris@8 579 e.freq = peakfreq;
Chris@8 580 e.time = timestamp;
Chris@15 581 e.confidence = confidence;
Chris@8 582
Chris@8 583 m_accepted.advanceTime();
Chris@11 584
Chris@8 585 for (int i = 0; i < m_possible.size(); ++i) {
Chris@8 586 m_possible[i].advanceTime();
Chris@8 587 }
Chris@8 588
Chris@11 589 if (!m_accepted.test(e)) {
Chris@13 590
Chris@11 591 int candidate = -1;
Chris@13 592 bool accepted = false;
Chris@13 593
Chris@11 594 for (int i = 0; i < m_possible.size(); ++i) {
Chris@11 595 if (m_possible[i].test(e)) {
Chris@13 596 accepted = true;
Chris@11 597 if (m_possible[i].getState() == Hypothesis::Satisfied) {
Chris@11 598 candidate = i;
Chris@11 599 }
Chris@11 600 break;
Chris@11 601 }
Chris@11 602 }
Chris@12 603
Chris@13 604 if (!accepted) {
Chris@13 605 Hypothesis h;
Chris@13 606 h.test(e); //!!! must succeed as h is new, so perhaps there should be a ctor for this
Chris@13 607 m_possible.push_back(h);
Chris@13 608 }
Chris@13 609
Chris@11 610 if (m_accepted.getState() == Hypothesis::Expired) {
Chris@16 611 m_accepted.addFeatures(fs);
Chris@12 612 }
Chris@12 613
Chris@12 614 if (m_accepted.getState() == Hypothesis::Expired ||
Chris@12 615 m_accepted.getState() == Hypothesis::Rejected) {
Chris@11 616 if (candidate >= 0) {
Chris@11 617 m_accepted = m_possible[candidate];
Chris@11 618 } else {
Chris@11 619 m_accepted = Hypothesis();
Chris@11 620 }
Chris@11 621 }
Chris@8 622
Chris@14 623 // reap rejected/expired hypotheses from possible list
Chris@14 624 Hypotheses toReap = m_possible;
Chris@14 625 m_possible.clear();
Chris@14 626 for (int i = 0; i < toReap.size(); ++i) {
Chris@14 627 Hypothesis h = toReap[i];
Chris@14 628 if (h.getState() != Hypothesis::Rejected &&
Chris@14 629 h.getState() != Hypothesis::Expired) {
Chris@14 630 m_possible.push_back(h);
Chris@14 631 }
Chris@14 632 }
Chris@14 633 }
Chris@14 634
Chris@15 635 std::cerr << "accepted length = " << m_accepted.getPendingLength()
Chris@15 636 << ", state = " << m_accepted.getState()
Chris@15 637 << ", hypothesis count = " << m_possible.size() << std::endl;
Chris@12 638
Chris@3 639 delete[] data;
Chris@3 640 return fs;
Chris@3 641 }
Chris@3 642
Chris@3 643 CepstrumPitchTracker::FeatureSet
Chris@3 644 CepstrumPitchTracker::getRemainingFeatures()
Chris@3 645 {
Chris@3 646 FeatureSet fs;
Chris@15 647 if (m_accepted.getState() == Hypothesis::Satisfied) {
Chris@16 648 m_accepted.addFeatures(fs);
Chris@11 649 }
Chris@3 650 return fs;
Chris@3 651 }
Chris@3 652
Chris@3 653 void
Chris@3 654 CepstrumPitchTracker::fft(unsigned int n, bool inverse,
Chris@24 655 double *ri, double *ii, double *ro, double *io)
Chris@3 656 {
Chris@3 657 if (!ri || !ro || !io) return;
Chris@3 658
Chris@3 659 unsigned int bits;
Chris@3 660 unsigned int i, j, k, m;
Chris@3 661 unsigned int blockSize, blockEnd;
Chris@3 662
Chris@3 663 double tr, ti;
Chris@3 664
Chris@3 665 if (n < 2) return;
Chris@3 666 if (n & (n-1)) return;
Chris@3 667
Chris@3 668 double angle = 2.0 * M_PI;
Chris@3 669 if (inverse) angle = -angle;
Chris@3 670
Chris@3 671 for (i = 0; ; ++i) {
Chris@3 672 if (n & (1 << i)) {
Chris@3 673 bits = i;
Chris@3 674 break;
Chris@3 675 }
Chris@3 676 }
Chris@3 677
Chris@24 678 int table[n];
Chris@3 679
Chris@23 680 for (i = 0; i < n; ++i) {
Chris@23 681 m = i;
Chris@23 682 for (j = k = 0; j < bits; ++j) {
Chris@23 683 k = (k << 1) | (m & 1);
Chris@23 684 m >>= 1;
Chris@23 685 }
Chris@23 686 table[i] = k;
Chris@3 687 }
Chris@3 688
Chris@3 689 if (ii) {
Chris@3 690 for (i = 0; i < n; ++i) {
Chris@3 691 ro[table[i]] = ri[i];
Chris@3 692 io[table[i]] = ii[i];
Chris@3 693 }
Chris@3 694 } else {
Chris@3 695 for (i = 0; i < n; ++i) {
Chris@3 696 ro[table[i]] = ri[i];
Chris@3 697 io[table[i]] = 0.0;
Chris@3 698 }
Chris@3 699 }
Chris@3 700
Chris@3 701 blockEnd = 1;
Chris@3 702
Chris@3 703 for (blockSize = 2; blockSize <= n; blockSize <<= 1) {
Chris@3 704
Chris@3 705 double delta = angle / (double)blockSize;
Chris@3 706 double sm2 = -sin(-2 * delta);
Chris@3 707 double sm1 = -sin(-delta);
Chris@3 708 double cm2 = cos(-2 * delta);
Chris@3 709 double cm1 = cos(-delta);
Chris@3 710 double w = 2 * cm1;
Chris@3 711 double ar[3], ai[3];
Chris@3 712
Chris@3 713 for (i = 0; i < n; i += blockSize) {
Chris@3 714
Chris@3 715 ar[2] = cm2;
Chris@3 716 ar[1] = cm1;
Chris@3 717
Chris@3 718 ai[2] = sm2;
Chris@3 719 ai[1] = sm1;
Chris@3 720
Chris@3 721 for (j = i, m = 0; m < blockEnd; j++, m++) {
Chris@3 722
Chris@3 723 ar[0] = w * ar[1] - ar[2];
Chris@3 724 ar[2] = ar[1];
Chris@3 725 ar[1] = ar[0];
Chris@3 726
Chris@3 727 ai[0] = w * ai[1] - ai[2];
Chris@3 728 ai[2] = ai[1];
Chris@3 729 ai[1] = ai[0];
Chris@3 730
Chris@3 731 k = j + blockEnd;
Chris@3 732 tr = ar[0] * ro[k] - ai[0] * io[k];
Chris@3 733 ti = ar[0] * io[k] + ai[0] * ro[k];
Chris@3 734
Chris@3 735 ro[k] = ro[j] - tr;
Chris@3 736 io[k] = io[j] - ti;
Chris@3 737
Chris@3 738 ro[j] += tr;
Chris@3 739 io[j] += ti;
Chris@3 740 }
Chris@3 741 }
Chris@3 742
Chris@3 743 blockEnd = blockSize;
Chris@3 744 }
Chris@3 745 }
Chris@3 746
Chris@3 747