annotate CepstrumPitchTracker.cpp @ 27:44bb93cae288

Change peak-to-next-peak ratio to a difference (because the difference between peaks in log values doesn't vary with signal amplification)
author Chris Cannam
date Sat, 07 Jul 2012 21:06:37 +0100
parents a15d8c89a36e
children 8a77e4de0d46
rev   line source
Chris@8 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@8 2 /*
Chris@8 3 Permission is hereby granted, free of charge, to any person
Chris@8 4 obtaining a copy of this software and associated documentation
Chris@8 5 files (the "Software"), to deal in the Software without
Chris@8 6 restriction, including without limitation the rights to use, copy,
Chris@8 7 modify, merge, publish, distribute, sublicense, and/or sell copies
Chris@8 8 of the Software, and to permit persons to whom the Software is
Chris@8 9 furnished to do so, subject to the following conditions:
Chris@8 10
Chris@8 11 The above copyright notice and this permission notice shall be
Chris@8 12 included in all copies or substantial portions of the Software.
Chris@8 13
Chris@8 14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
Chris@8 15 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
Chris@8 16 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
Chris@8 17 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
Chris@8 18 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
Chris@8 19 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
Chris@8 20 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Chris@8 21 */
Chris@8 22
Chris@8 23 #include "CepstrumPitchTracker.h"
Chris@8 24
Chris@8 25 #include <vector>
Chris@8 26 #include <algorithm>
Chris@8 27
Chris@8 28 #include <cstdio>
Chris@8 29 #include <cmath>
Chris@8 30 #include <complex>
Chris@8 31
Chris@8 32 using std::string;
Chris@12 33 using std::vector;
Chris@21 34 using Vamp::RealTime;
Chris@12 35
Chris@13 36 CepstrumPitchTracker::Hypothesis::Hypothesis()
Chris@12 37 {
Chris@13 38 m_state = New;
Chris@12 39 m_age = 0;
Chris@12 40 }
Chris@12 41
Chris@16 42 CepstrumPitchTracker::Hypothesis::~Hypothesis()
Chris@16 43 {
Chris@16 44 }
Chris@16 45
Chris@12 46 bool
Chris@12 47 CepstrumPitchTracker::Hypothesis::isWithinTolerance(Estimate s)
Chris@12 48 {
Chris@12 49 if (m_pending.empty()) {
Chris@12 50 return true;
Chris@12 51 }
Chris@21 52
Chris@21 53 // check we are within a relatively close tolerance of the last
Chris@21 54 // candidate
Chris@22 55 Estimate last = m_pending[m_pending.size()-1];
Chris@12 56 double r = s.freq / last.freq;
Chris@12 57 int cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@22 58 if (cents < -60 || cents > 60) return false;
Chris@21 59
Chris@22 60 // and within a slightly bigger tolerance of the current mean
Chris@22 61 double meanFreq = getMeanFrequency();
Chris@22 62 r = s.freq / meanFreq;
Chris@21 63 cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@21 64 if (cents < -80 || cents > 80) return false;
Chris@21 65
Chris@21 66 return true;
Chris@12 67 }
Chris@12 68
Chris@12 69 bool
Chris@12 70 CepstrumPitchTracker::Hypothesis::isSatisfied()
Chris@12 71 {
Chris@20 72 if (m_pending.empty()) return false;
Chris@20 73
Chris@20 74 double meanConfidence = 0.0;
Chris@20 75 for (int i = 0; i < m_pending.size(); ++i) {
Chris@20 76 meanConfidence += m_pending[i].confidence;
Chris@20 77 }
Chris@20 78 meanConfidence /= m_pending.size();
Chris@20 79
Chris@20 80 int lengthRequired = int(2.0 / meanConfidence + 0.5);
Chris@20 81 std::cerr << "meanConfidence = " << meanConfidence << ", lengthRequired = " << lengthRequired << ", length = " << m_pending.size() << std::endl;
Chris@20 82
Chris@20 83 return (m_pending.size() > lengthRequired);
Chris@12 84 }
Chris@12 85
Chris@13 86 void
Chris@13 87 CepstrumPitchTracker::Hypothesis::advanceTime()
Chris@13 88 {
Chris@13 89 ++m_age;
Chris@13 90 }
Chris@13 91
Chris@12 92 bool
Chris@12 93 CepstrumPitchTracker::Hypothesis::test(Estimate s)
Chris@12 94 {
Chris@13 95 bool accept = false;
Chris@13 96
Chris@13 97 switch (m_state) {
Chris@13 98
Chris@13 99 case New:
Chris@13 100 m_state = Provisional;
Chris@13 101 accept = true;
Chris@13 102 break;
Chris@13 103
Chris@13 104 case Provisional:
Chris@13 105 if (m_age > 3) {
Chris@13 106 m_state = Rejected;
Chris@13 107 } else if (isWithinTolerance(s)) {
Chris@13 108 accept = true;
Chris@13 109 }
Chris@13 110 break;
Chris@13 111
Chris@13 112 case Satisfied:
Chris@13 113 if (m_age > 3) {
Chris@13 114 m_state = Expired;
Chris@13 115 } else if (isWithinTolerance(s)) {
Chris@13 116 accept = true;
Chris@13 117 }
Chris@13 118 break;
Chris@13 119
Chris@13 120 case Rejected:
Chris@13 121 break;
Chris@13 122
Chris@13 123 case Expired:
Chris@13 124 break;
Chris@12 125 }
Chris@12 126
Chris@13 127 if (accept) {
Chris@13 128 m_pending.push_back(s);
Chris@13 129 m_age = 0;
Chris@13 130 if (m_state == Provisional && isSatisfied()) {
Chris@13 131 m_state = Satisfied;
Chris@12 132 }
Chris@12 133 }
Chris@12 134
Chris@19 135 return accept && (m_state == Satisfied);
Chris@13 136 }
Chris@12 137
Chris@12 138 CepstrumPitchTracker::Hypothesis::State
Chris@12 139 CepstrumPitchTracker::Hypothesis::getState()
Chris@12 140 {
Chris@12 141 return m_state;
Chris@12 142 }
Chris@12 143
Chris@17 144 int
Chris@17 145 CepstrumPitchTracker::Hypothesis::getPendingLength()
Chris@17 146 {
Chris@17 147 return m_pending.size();
Chris@17 148 }
Chris@17 149
Chris@12 150 CepstrumPitchTracker::Hypothesis::Estimates
Chris@12 151 CepstrumPitchTracker::Hypothesis::getAcceptedEstimates()
Chris@12 152 {
Chris@12 153 if (m_state == Satisfied || m_state == Expired) {
Chris@12 154 return m_pending;
Chris@12 155 } else {
Chris@12 156 return Estimates();
Chris@12 157 }
Chris@12 158 }
Chris@12 159
Chris@22 160 double
Chris@22 161 CepstrumPitchTracker::Hypothesis::getMeanFrequency()
Chris@22 162 {
Chris@22 163 double acc = 0.0;
Chris@22 164 for (int i = 0; i < m_pending.size(); ++i) {
Chris@22 165 acc += m_pending[i].freq;
Chris@22 166 }
Chris@22 167 acc /= m_pending.size();
Chris@22 168 return acc;
Chris@22 169 }
Chris@22 170
Chris@21 171 CepstrumPitchTracker::Hypothesis::Note
Chris@21 172 CepstrumPitchTracker::Hypothesis::getAveragedNote()
Chris@21 173 {
Chris@21 174 Note n;
Chris@21 175
Chris@21 176 if (!(m_state == Satisfied || m_state == Expired)) {
Chris@21 177 n.freq = 0.0;
Chris@21 178 n.time = RealTime::zeroTime;
Chris@21 179 n.duration = RealTime::zeroTime;
Chris@21 180 return n;
Chris@21 181 }
Chris@21 182
Chris@21 183 n.time = m_pending.begin()->time;
Chris@21 184
Chris@21 185 Estimates::iterator i = m_pending.end();
Chris@21 186 --i;
Chris@21 187 n.duration = i->time - n.time;
Chris@21 188
Chris@22 189 // just mean frequency for now, but this isn't at all right perceptually
Chris@22 190 n.freq = getMeanFrequency();
Chris@21 191
Chris@21 192 return n;
Chris@21 193 }
Chris@21 194
Chris@16 195 void
Chris@21 196 CepstrumPitchTracker::Hypothesis::addFeatures(FeatureSet &fs)
Chris@16 197 {
Chris@16 198 for (int i = 0; i < m_pending.size(); ++i) {
Chris@16 199 Feature f;
Chris@16 200 f.hasTimestamp = true;
Chris@16 201 f.timestamp = m_pending[i].time;
Chris@16 202 f.values.push_back(m_pending[i].freq);
Chris@21 203 fs[0].push_back(f);
Chris@16 204 }
Chris@21 205
Chris@21 206 Feature nf;
Chris@21 207 nf.hasTimestamp = true;
Chris@21 208 nf.hasDuration = true;
Chris@21 209 Note n = getAveragedNote();
Chris@21 210 nf.timestamp = n.time;
Chris@21 211 nf.duration = n.duration;
Chris@21 212 nf.values.push_back(n.freq);
Chris@21 213 fs[1].push_back(nf);
Chris@16 214 }
Chris@8 215
Chris@8 216 CepstrumPitchTracker::CepstrumPitchTracker(float inputSampleRate) :
Chris@8 217 Plugin(inputSampleRate),
Chris@8 218 m_channels(0),
Chris@8 219 m_stepSize(256),
Chris@8 220 m_blockSize(1024),
Chris@8 221 m_fmin(50),
Chris@8 222 m_fmax(1000),
Chris@25 223 m_vflen(1),
Chris@8 224 m_binFrom(0),
Chris@8 225 m_binTo(0),
Chris@20 226 m_bins(0)
Chris@8 227 {
Chris@8 228 }
Chris@8 229
Chris@8 230 CepstrumPitchTracker::~CepstrumPitchTracker()
Chris@8 231 {
Chris@8 232 }
Chris@8 233
Chris@8 234 string
Chris@8 235 CepstrumPitchTracker::getIdentifier() const
Chris@8 236 {
Chris@8 237 return "cepstrum-pitch";
Chris@8 238 }
Chris@8 239
Chris@8 240 string
Chris@8 241 CepstrumPitchTracker::getName() const
Chris@8 242 {
Chris@8 243 return "Cepstrum Pitch Tracker";
Chris@8 244 }
Chris@8 245
Chris@8 246 string
Chris@8 247 CepstrumPitchTracker::getDescription() const
Chris@8 248 {
Chris@8 249 return "Estimate f0 of monophonic material using a cepstrum method.";
Chris@8 250 }
Chris@8 251
Chris@8 252 string
Chris@8 253 CepstrumPitchTracker::getMaker() const
Chris@8 254 {
Chris@8 255 return "Chris Cannam";
Chris@8 256 }
Chris@8 257
Chris@8 258 int
Chris@8 259 CepstrumPitchTracker::getPluginVersion() const
Chris@8 260 {
Chris@8 261 // Increment this each time you release a version that behaves
Chris@8 262 // differently from the previous one
Chris@8 263 return 1;
Chris@8 264 }
Chris@8 265
Chris@8 266 string
Chris@8 267 CepstrumPitchTracker::getCopyright() const
Chris@8 268 {
Chris@8 269 return "Freely redistributable (BSD license)";
Chris@8 270 }
Chris@8 271
Chris@8 272 CepstrumPitchTracker::InputDomain
Chris@8 273 CepstrumPitchTracker::getInputDomain() const
Chris@8 274 {
Chris@8 275 return FrequencyDomain;
Chris@8 276 }
Chris@8 277
Chris@8 278 size_t
Chris@8 279 CepstrumPitchTracker::getPreferredBlockSize() const
Chris@8 280 {
Chris@8 281 return 1024;
Chris@8 282 }
Chris@8 283
Chris@8 284 size_t
Chris@8 285 CepstrumPitchTracker::getPreferredStepSize() const
Chris@8 286 {
Chris@8 287 return 256;
Chris@8 288 }
Chris@8 289
Chris@8 290 size_t
Chris@8 291 CepstrumPitchTracker::getMinChannelCount() const
Chris@8 292 {
Chris@8 293 return 1;
Chris@8 294 }
Chris@8 295
Chris@8 296 size_t
Chris@8 297 CepstrumPitchTracker::getMaxChannelCount() const
Chris@8 298 {
Chris@8 299 return 1;
Chris@8 300 }
Chris@8 301
Chris@8 302 CepstrumPitchTracker::ParameterList
Chris@8 303 CepstrumPitchTracker::getParameterDescriptors() const
Chris@8 304 {
Chris@8 305 ParameterList list;
Chris@8 306 return list;
Chris@8 307 }
Chris@8 308
Chris@8 309 float
Chris@8 310 CepstrumPitchTracker::getParameter(string identifier) const
Chris@8 311 {
Chris@8 312 return 0.f;
Chris@8 313 }
Chris@8 314
Chris@8 315 void
Chris@8 316 CepstrumPitchTracker::setParameter(string identifier, float value)
Chris@8 317 {
Chris@8 318 }
Chris@8 319
Chris@8 320 CepstrumPitchTracker::ProgramList
Chris@8 321 CepstrumPitchTracker::getPrograms() const
Chris@8 322 {
Chris@8 323 ProgramList list;
Chris@8 324 return list;
Chris@8 325 }
Chris@8 326
Chris@8 327 string
Chris@8 328 CepstrumPitchTracker::getCurrentProgram() const
Chris@8 329 {
Chris@8 330 return ""; // no programs
Chris@8 331 }
Chris@8 332
Chris@8 333 void
Chris@8 334 CepstrumPitchTracker::selectProgram(string name)
Chris@8 335 {
Chris@8 336 }
Chris@8 337
Chris@8 338 CepstrumPitchTracker::OutputList
Chris@8 339 CepstrumPitchTracker::getOutputDescriptors() const
Chris@8 340 {
Chris@8 341 OutputList outputs;
Chris@8 342
Chris@8 343 int n = 0;
Chris@8 344
Chris@8 345 OutputDescriptor d;
Chris@8 346
Chris@8 347 d.identifier = "f0";
Chris@8 348 d.name = "Estimated f0";
Chris@8 349 d.description = "Estimated fundamental frequency";
Chris@8 350 d.unit = "Hz";
Chris@8 351 d.hasFixedBinCount = true;
Chris@8 352 d.binCount = 1;
Chris@8 353 d.hasKnownExtents = true;
Chris@8 354 d.minValue = m_fmin;
Chris@8 355 d.maxValue = m_fmax;
Chris@8 356 d.isQuantized = false;
Chris@8 357 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@8 358 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@8 359 d.hasDuration = false;
Chris@8 360 outputs.push_back(d);
Chris@8 361
Chris@21 362 d.identifier = "notes";
Chris@21 363 d.name = "Notes";
Chris@21 364 d.description = "Derived fixed-pitch note frequencies";
Chris@21 365 d.unit = "Hz";
Chris@21 366 d.hasFixedBinCount = true;
Chris@21 367 d.binCount = 1;
Chris@21 368 d.hasKnownExtents = true;
Chris@21 369 d.minValue = m_fmin;
Chris@21 370 d.maxValue = m_fmax;
Chris@21 371 d.isQuantized = false;
Chris@21 372 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@21 373 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@21 374 d.hasDuration = true;
Chris@21 375 outputs.push_back(d);
Chris@21 376
Chris@8 377 return outputs;
Chris@8 378 }
Chris@8 379
Chris@8 380 bool
Chris@8 381 CepstrumPitchTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
Chris@8 382 {
Chris@8 383 if (channels < getMinChannelCount() ||
Chris@8 384 channels > getMaxChannelCount()) return false;
Chris@8 385
Chris@8 386 // std::cerr << "CepstrumPitchTracker::initialise: channels = " << channels
Chris@8 387 // << ", stepSize = " << stepSize << ", blockSize = " << blockSize
Chris@8 388 // << std::endl;
Chris@8 389
Chris@8 390 m_channels = channels;
Chris@8 391 m_stepSize = stepSize;
Chris@8 392 m_blockSize = blockSize;
Chris@8 393
Chris@8 394 m_binFrom = int(m_inputSampleRate / m_fmax);
Chris@8 395 m_binTo = int(m_inputSampleRate / m_fmin);
Chris@8 396
Chris@8 397 if (m_binTo >= (int)m_blockSize / 2) {
Chris@8 398 m_binTo = m_blockSize / 2 - 1;
Chris@8 399 }
Chris@8 400
Chris@8 401 m_bins = (m_binTo - m_binFrom) + 1;
Chris@8 402
Chris@8 403 reset();
Chris@8 404
Chris@8 405 return true;
Chris@8 406 }
Chris@8 407
Chris@8 408 void
Chris@8 409 CepstrumPitchTracker::reset()
Chris@8 410 {
Chris@8 411 }
Chris@8 412
Chris@8 413 void
Chris@20 414 CepstrumPitchTracker::filter(const double *cep, double *data)
Chris@8 415 {
Chris@8 416 for (int i = 0; i < m_bins; ++i) {
Chris@10 417 double v = 0;
Chris@10 418 int n = 0;
Chris@10 419 // average according to the vertical filter length
Chris@10 420 for (int j = -m_vflen/2; j <= m_vflen/2; ++j) {
Chris@10 421 int ix = i + m_binFrom + j;
Chris@10 422 if (ix >= 0 && ix < m_blockSize) {
Chris@10 423 v += cep[ix];
Chris@10 424 ++n;
Chris@10 425 }
Chris@10 426 }
Chris@20 427 data[i] = v / n;
Chris@8 428 }
Chris@11 429 }
Chris@11 430
Chris@25 431 double
Chris@25 432 CepstrumPitchTracker::cubicInterpolate(const double y[4], double x)
Chris@25 433 {
Chris@25 434 double a0 = y[3] - y[2] - y[0] + y[1];
Chris@25 435 double a1 = y[0] - y[1] - a0;
Chris@25 436 double a2 = y[2] - y[0];
Chris@25 437 double a3 = y[1];
Chris@25 438 return
Chris@25 439 a0 * x * x * x +
Chris@25 440 a1 * x * x +
Chris@25 441 a2 * x +
Chris@25 442 a3;
Chris@25 443 }
Chris@25 444
Chris@25 445 double
Chris@25 446 CepstrumPitchTracker::findInterpolatedPeak(const double *in, int maxbin)
Chris@25 447 {
Chris@25 448 if (maxbin < 2 || maxbin > m_bins - 3) {
Chris@25 449 return maxbin;
Chris@25 450 }
Chris@25 451
Chris@25 452 double maxval = 0.0;
Chris@25 453 double maxidx = maxbin;
Chris@25 454
Chris@25 455 const int divisions = 10;
Chris@25 456 double y[4];
Chris@25 457
Chris@25 458 y[0] = in[maxbin-1];
Chris@25 459 y[1] = in[maxbin];
Chris@25 460 y[2] = in[maxbin+1];
Chris@25 461 y[3] = in[maxbin+2];
Chris@25 462 for (int i = 0; i < divisions; ++i) {
Chris@25 463 double probe = double(i) / double(divisions);
Chris@25 464 double value = cubicInterpolate(y, probe);
Chris@25 465 if (value > maxval) {
Chris@25 466 maxval = value;
Chris@25 467 maxidx = maxbin + probe;
Chris@25 468 }
Chris@25 469 }
Chris@25 470
Chris@25 471 y[3] = y[2];
Chris@25 472 y[2] = y[1];
Chris@25 473 y[1] = y[0];
Chris@25 474 y[0] = in[maxbin-2];
Chris@25 475 for (int i = 0; i < divisions; ++i) {
Chris@25 476 double probe = double(i) / double(divisions);
Chris@25 477 double value = cubicInterpolate(y, probe);
Chris@25 478 if (value > maxval) {
Chris@25 479 maxval = value;
Chris@25 480 maxidx = maxbin - 1 + probe;
Chris@25 481 }
Chris@25 482 }
Chris@25 483
Chris@25 484 /*
Chris@25 485 std::cerr << "centre = " << maxbin << ": ["
Chris@25 486 << in[maxbin-2] << ","
Chris@25 487 << in[maxbin-1] << ","
Chris@25 488 << in[maxbin] << ","
Chris@25 489 << in[maxbin+1] << ","
Chris@25 490 << in[maxbin+2] << "] -> " << maxidx << std::endl;
Chris@25 491 */
Chris@25 492
Chris@25 493 return maxidx;
Chris@25 494 }
Chris@25 495
Chris@8 496 CepstrumPitchTracker::FeatureSet
Chris@21 497 CepstrumPitchTracker::process(const float *const *inputBuffers, RealTime timestamp)
Chris@8 498 {
Chris@8 499 FeatureSet fs;
Chris@8 500
Chris@8 501 int bs = m_blockSize;
Chris@8 502 int hs = m_blockSize/2 + 1;
Chris@8 503
Chris@8 504 double *rawcep = new double[bs];
Chris@8 505 double *io = new double[bs];
Chris@8 506 double *logmag = new double[bs];
Chris@8 507
Chris@9 508 // The "inverse symmetric" method. Seems to be the most reliable
Chris@8 509
Chris@8 510 for (int i = 0; i < hs; ++i) {
Chris@8 511
Chris@8 512 double power =
Chris@8 513 inputBuffers[0][i*2 ] * inputBuffers[0][i*2 ] +
Chris@8 514 inputBuffers[0][i*2+1] * inputBuffers[0][i*2+1];
Chris@8 515 double mag = sqrt(power);
Chris@8 516
Chris@8 517 double lm = log(mag + 0.00000001);
Chris@8 518
Chris@9 519 logmag[i] = lm;
Chris@9 520 if (i > 0) logmag[bs - i] = lm;
Chris@8 521 }
Chris@8 522
Chris@9 523 fft(bs, true, logmag, 0, rawcep, io);
Chris@8 524
Chris@8 525 delete[] logmag;
Chris@8 526 delete[] io;
Chris@8 527
Chris@8 528 int n = m_bins;
Chris@8 529 double *data = new double[n];
Chris@8 530 filter(rawcep, data);
Chris@8 531 delete[] rawcep;
Chris@8 532
Chris@8 533 double maxval = 0.0;
Chris@11 534 int maxbin = -1;
Chris@8 535
Chris@8 536 for (int i = 0; i < n; ++i) {
Chris@8 537 if (data[i] > maxval) {
Chris@8 538 maxval = data[i];
Chris@8 539 maxbin = i;
Chris@8 540 }
Chris@8 541 }
Chris@8 542
Chris@20 543 if (maxbin < 0) {
Chris@20 544 delete[] data;
Chris@20 545 return fs;
Chris@20 546 }
Chris@20 547
Chris@20 548 double nextPeakVal = 0.0;
Chris@20 549 for (int i = 1; i+1 < n; ++i) {
Chris@20 550 if (data[i] > data[i-1] &&
Chris@20 551 data[i] > data[i+1] &&
Chris@20 552 i != maxbin &&
Chris@20 553 data[i] > nextPeakVal) {
Chris@20 554 nextPeakVal = data[i];
Chris@20 555 }
Chris@20 556 }
Chris@13 557
Chris@25 558 double cimax = findInterpolatedPeak(data, maxbin);
Chris@25 559 double peakfreq = m_inputSampleRate / (cimax + m_binFrom);
Chris@20 560
Chris@20 561 double confidence = 0.0;
Chris@20 562 if (nextPeakVal != 0.0) {
Chris@27 563 confidence = (maxval - nextPeakVal) / 200.0;
Chris@20 564 if (confidence > 1.0) confidence = 1.0;
Chris@20 565 }
Chris@20 566
Chris@13 567 Hypothesis::Estimate e;
Chris@13 568 e.freq = peakfreq;
Chris@13 569 e.time = timestamp;
Chris@20 570 e.confidence = confidence;
Chris@13 571
Chris@13 572 m_accepted.advanceTime();
Chris@16 573
Chris@13 574 for (int i = 0; i < m_possible.size(); ++i) {
Chris@13 575 m_possible[i].advanceTime();
Chris@13 576 }
Chris@13 577
Chris@16 578 if (!m_accepted.test(e)) {
Chris@18 579
Chris@16 580 int candidate = -1;
Chris@18 581 bool accepted = false;
Chris@18 582
Chris@16 583 for (int i = 0; i < m_possible.size(); ++i) {
Chris@16 584 if (m_possible[i].test(e)) {
Chris@18 585 accepted = true;
Chris@16 586 if (m_possible[i].getState() == Hypothesis::Satisfied) {
Chris@16 587 candidate = i;
Chris@16 588 }
Chris@16 589 break;
Chris@16 590 }
Chris@16 591 }
Chris@17 592
Chris@18 593 if (!accepted) {
Chris@18 594 Hypothesis h;
Chris@18 595 h.test(e); //!!! must succeed as h is new, so perhaps there should be a ctor for this
Chris@18 596 m_possible.push_back(h);
Chris@18 597 }
Chris@18 598
Chris@16 599 if (m_accepted.getState() == Hypothesis::Expired) {
Chris@21 600 m_accepted.addFeatures(fs);
Chris@17 601 }
Chris@17 602
Chris@17 603 if (m_accepted.getState() == Hypothesis::Expired ||
Chris@17 604 m_accepted.getState() == Hypothesis::Rejected) {
Chris@16 605 if (candidate >= 0) {
Chris@16 606 m_accepted = m_possible[candidate];
Chris@16 607 } else {
Chris@16 608 m_accepted = Hypothesis();
Chris@16 609 }
Chris@16 610 }
Chris@13 611
Chris@19 612 // reap rejected/expired hypotheses from possible list
Chris@19 613 Hypotheses toReap = m_possible;
Chris@19 614 m_possible.clear();
Chris@19 615 for (int i = 0; i < toReap.size(); ++i) {
Chris@19 616 Hypothesis h = toReap[i];
Chris@19 617 if (h.getState() != Hypothesis::Rejected &&
Chris@19 618 h.getState() != Hypothesis::Expired) {
Chris@19 619 m_possible.push_back(h);
Chris@19 620 }
Chris@19 621 }
Chris@19 622 }
Chris@19 623
Chris@20 624 std::cerr << "accepted length = " << m_accepted.getPendingLength()
Chris@20 625 << ", state = " << m_accepted.getState()
Chris@20 626 << ", hypothesis count = " << m_possible.size() << std::endl;
Chris@17 627
Chris@8 628 delete[] data;
Chris@8 629 return fs;
Chris@8 630 }
Chris@8 631
Chris@8 632 CepstrumPitchTracker::FeatureSet
Chris@8 633 CepstrumPitchTracker::getRemainingFeatures()
Chris@8 634 {
Chris@8 635 FeatureSet fs;
Chris@20 636 if (m_accepted.getState() == Hypothesis::Satisfied) {
Chris@21 637 m_accepted.addFeatures(fs);
Chris@16 638 }
Chris@8 639 return fs;
Chris@8 640 }
Chris@8 641
Chris@8 642 void
Chris@8 643 CepstrumPitchTracker::fft(unsigned int n, bool inverse,
Chris@8 644 double *ri, double *ii, double *ro, double *io)
Chris@8 645 {
Chris@8 646 if (!ri || !ro || !io) return;
Chris@8 647
Chris@8 648 unsigned int bits;
Chris@8 649 unsigned int i, j, k, m;
Chris@8 650 unsigned int blockSize, blockEnd;
Chris@8 651
Chris@8 652 double tr, ti;
Chris@8 653
Chris@8 654 if (n < 2) return;
Chris@8 655 if (n & (n-1)) return;
Chris@8 656
Chris@8 657 double angle = 2.0 * M_PI;
Chris@8 658 if (inverse) angle = -angle;
Chris@8 659
Chris@8 660 for (i = 0; ; ++i) {
Chris@8 661 if (n & (1 << i)) {
Chris@8 662 bits = i;
Chris@8 663 break;
Chris@8 664 }
Chris@8 665 }
Chris@8 666
Chris@8 667 static unsigned int tableSize = 0;
Chris@8 668 static int *table = 0;
Chris@8 669
Chris@8 670 if (tableSize != n) {
Chris@8 671
Chris@8 672 delete[] table;
Chris@8 673
Chris@8 674 table = new int[n];
Chris@8 675
Chris@8 676 for (i = 0; i < n; ++i) {
Chris@8 677
Chris@8 678 m = i;
Chris@8 679
Chris@8 680 for (j = k = 0; j < bits; ++j) {
Chris@8 681 k = (k << 1) | (m & 1);
Chris@8 682 m >>= 1;
Chris@8 683 }
Chris@8 684
Chris@8 685 table[i] = k;
Chris@8 686 }
Chris@8 687
Chris@8 688 tableSize = n;
Chris@8 689 }
Chris@8 690
Chris@8 691 if (ii) {
Chris@8 692 for (i = 0; i < n; ++i) {
Chris@8 693 ro[table[i]] = ri[i];
Chris@8 694 io[table[i]] = ii[i];
Chris@8 695 }
Chris@8 696 } else {
Chris@8 697 for (i = 0; i < n; ++i) {
Chris@8 698 ro[table[i]] = ri[i];
Chris@8 699 io[table[i]] = 0.0;
Chris@8 700 }
Chris@8 701 }
Chris@8 702
Chris@8 703 blockEnd = 1;
Chris@8 704
Chris@8 705 for (blockSize = 2; blockSize <= n; blockSize <<= 1) {
Chris@8 706
Chris@8 707 double delta = angle / (double)blockSize;
Chris@8 708 double sm2 = -sin(-2 * delta);
Chris@8 709 double sm1 = -sin(-delta);
Chris@8 710 double cm2 = cos(-2 * delta);
Chris@8 711 double cm1 = cos(-delta);
Chris@8 712 double w = 2 * cm1;
Chris@8 713 double ar[3], ai[3];
Chris@8 714
Chris@8 715 for (i = 0; i < n; i += blockSize) {
Chris@8 716
Chris@8 717 ar[2] = cm2;
Chris@8 718 ar[1] = cm1;
Chris@8 719
Chris@8 720 ai[2] = sm2;
Chris@8 721 ai[1] = sm1;
Chris@8 722
Chris@8 723 for (j = i, m = 0; m < blockEnd; j++, m++) {
Chris@8 724
Chris@8 725 ar[0] = w * ar[1] - ar[2];
Chris@8 726 ar[2] = ar[1];
Chris@8 727 ar[1] = ar[0];
Chris@8 728
Chris@8 729 ai[0] = w * ai[1] - ai[2];
Chris@8 730 ai[2] = ai[1];
Chris@8 731 ai[1] = ai[0];
Chris@8 732
Chris@8 733 k = j + blockEnd;
Chris@8 734 tr = ar[0] * ro[k] - ai[0] * io[k];
Chris@8 735 ti = ar[0] * io[k] + ai[0] * ro[k];
Chris@8 736
Chris@8 737 ro[k] = ro[j] - tr;
Chris@8 738 io[k] = io[j] - ti;
Chris@8 739
Chris@8 740 ro[j] += tr;
Chris@8 741 io[j] += ti;
Chris@8 742 }
Chris@8 743 }
Chris@8 744
Chris@8 745 blockEnd = blockSize;
Chris@8 746 }
Chris@8 747 }
Chris@8 748
Chris@8 749