annotate CepstrumPitchTracker.cpp @ 19:c9cac05ef9f2 track

Reap expired/rejected hypotheses from list; report an estimate as accepted only if the accepting hypothesis has been satisfied already (otherwise a different provisional hypothesis might become satisfied first)
author Chris Cannam
date Sun, 01 Jul 2012 11:33:37 +0100
parents 791e5c115b8d
children 7786d595d2f2
rev   line source
Chris@8 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@8 2 /*
Chris@8 3 Permission is hereby granted, free of charge, to any person
Chris@8 4 obtaining a copy of this software and associated documentation
Chris@8 5 files (the "Software"), to deal in the Software without
Chris@8 6 restriction, including without limitation the rights to use, copy,
Chris@8 7 modify, merge, publish, distribute, sublicense, and/or sell copies
Chris@8 8 of the Software, and to permit persons to whom the Software is
Chris@8 9 furnished to do so, subject to the following conditions:
Chris@8 10
Chris@8 11 The above copyright notice and this permission notice shall be
Chris@8 12 included in all copies or substantial portions of the Software.
Chris@8 13
Chris@8 14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
Chris@8 15 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
Chris@8 16 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
Chris@8 17 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
Chris@8 18 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
Chris@8 19 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
Chris@8 20 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Chris@8 21 */
Chris@8 22
Chris@8 23 #include "CepstrumPitchTracker.h"
Chris@8 24
Chris@8 25 #include <vector>
Chris@8 26 #include <algorithm>
Chris@8 27
Chris@8 28 #include <cstdio>
Chris@8 29 #include <cmath>
Chris@8 30 #include <complex>
Chris@8 31
Chris@8 32 using std::string;
Chris@12 33 using std::vector;
Chris@12 34
Chris@13 35 CepstrumPitchTracker::Hypothesis::Hypothesis()
Chris@12 36 {
Chris@13 37 m_state = New;
Chris@12 38 m_age = 0;
Chris@12 39 }
Chris@12 40
Chris@16 41 CepstrumPitchTracker::Hypothesis::~Hypothesis()
Chris@16 42 {
Chris@16 43 }
Chris@16 44
Chris@12 45 bool
Chris@12 46 CepstrumPitchTracker::Hypothesis::isWithinTolerance(Estimate s)
Chris@12 47 {
Chris@12 48 if (m_pending.empty()) {
Chris@12 49 return true;
Chris@12 50 }
Chris@12 51 Estimate last = m_pending[m_pending.size()-1];
Chris@12 52 double r = s.freq / last.freq;
Chris@12 53 int cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@19 54 return (cents > -100 && cents < 100);
Chris@12 55 }
Chris@12 56
Chris@12 57 bool
Chris@12 58 CepstrumPitchTracker::Hypothesis::isSatisfied()
Chris@12 59 {
Chris@12 60 return (m_pending.size() > 2);
Chris@12 61 }
Chris@12 62
Chris@13 63 void
Chris@13 64 CepstrumPitchTracker::Hypothesis::advanceTime()
Chris@13 65 {
Chris@13 66 ++m_age;
Chris@13 67 }
Chris@13 68
Chris@12 69 bool
Chris@12 70 CepstrumPitchTracker::Hypothesis::test(Estimate s)
Chris@12 71 {
Chris@13 72 bool accept = false;
Chris@13 73
Chris@13 74 switch (m_state) {
Chris@13 75
Chris@13 76 case New:
Chris@13 77 m_state = Provisional;
Chris@13 78 accept = true;
Chris@13 79 break;
Chris@13 80
Chris@13 81 case Provisional:
Chris@13 82 if (m_age > 3) {
Chris@13 83 m_state = Rejected;
Chris@13 84 } else if (isWithinTolerance(s)) {
Chris@13 85 accept = true;
Chris@13 86 }
Chris@13 87 break;
Chris@13 88
Chris@13 89 case Satisfied:
Chris@13 90 if (m_age > 3) {
Chris@13 91 m_state = Expired;
Chris@13 92 } else if (isWithinTolerance(s)) {
Chris@13 93 accept = true;
Chris@13 94 }
Chris@13 95 break;
Chris@13 96
Chris@13 97 case Rejected:
Chris@13 98 break;
Chris@13 99
Chris@13 100 case Expired:
Chris@13 101 break;
Chris@12 102 }
Chris@12 103
Chris@13 104 if (accept) {
Chris@13 105 m_pending.push_back(s);
Chris@13 106 m_age = 0;
Chris@13 107 if (m_state == Provisional && isSatisfied()) {
Chris@13 108 m_state = Satisfied;
Chris@12 109 }
Chris@12 110 }
Chris@12 111
Chris@19 112 return accept && (m_state == Satisfied);
Chris@13 113 }
Chris@12 114
Chris@12 115 CepstrumPitchTracker::Hypothesis::State
Chris@12 116 CepstrumPitchTracker::Hypothesis::getState()
Chris@12 117 {
Chris@12 118 return m_state;
Chris@12 119 }
Chris@12 120
Chris@17 121 int
Chris@17 122 CepstrumPitchTracker::Hypothesis::getPendingLength()
Chris@17 123 {
Chris@17 124 return m_pending.size();
Chris@17 125 }
Chris@17 126
Chris@12 127 CepstrumPitchTracker::Hypothesis::Estimates
Chris@12 128 CepstrumPitchTracker::Hypothesis::getAcceptedEstimates()
Chris@12 129 {
Chris@12 130 if (m_state == Satisfied || m_state == Expired) {
Chris@12 131 return m_pending;
Chris@12 132 } else {
Chris@12 133 return Estimates();
Chris@12 134 }
Chris@12 135 }
Chris@12 136
Chris@16 137 void
Chris@16 138 CepstrumPitchTracker::Hypothesis::addFeatures(FeatureList &fl)
Chris@16 139 {
Chris@16 140 for (int i = 0; i < m_pending.size(); ++i) {
Chris@16 141 Feature f;
Chris@16 142 f.hasTimestamp = true;
Chris@16 143 f.timestamp = m_pending[i].time;
Chris@16 144 f.values.push_back(m_pending[i].freq);
Chris@16 145 fl.push_back(f);
Chris@16 146 }
Chris@16 147 }
Chris@8 148
Chris@8 149 CepstrumPitchTracker::CepstrumPitchTracker(float inputSampleRate) :
Chris@8 150 Plugin(inputSampleRate),
Chris@8 151 m_channels(0),
Chris@8 152 m_stepSize(256),
Chris@8 153 m_blockSize(1024),
Chris@8 154 m_fmin(50),
Chris@8 155 m_fmax(1000),
Chris@10 156 m_histlen(1),
Chris@10 157 m_vflen(3),
Chris@8 158 m_binFrom(0),
Chris@8 159 m_binTo(0),
Chris@8 160 m_bins(0),
Chris@11 161 m_history(0),
Chris@11 162 m_prevpeak(0),
Chris@11 163 m_prevprop(0)
Chris@8 164 {
Chris@8 165 }
Chris@8 166
Chris@8 167 CepstrumPitchTracker::~CepstrumPitchTracker()
Chris@8 168 {
Chris@8 169 if (m_history) {
Chris@8 170 for (int i = 0; i < m_histlen; ++i) {
Chris@8 171 delete[] m_history[i];
Chris@8 172 }
Chris@8 173 delete[] m_history;
Chris@8 174 }
Chris@8 175 }
Chris@8 176
Chris@8 177 string
Chris@8 178 CepstrumPitchTracker::getIdentifier() const
Chris@8 179 {
Chris@8 180 return "cepstrum-pitch";
Chris@8 181 }
Chris@8 182
Chris@8 183 string
Chris@8 184 CepstrumPitchTracker::getName() const
Chris@8 185 {
Chris@8 186 return "Cepstrum Pitch Tracker";
Chris@8 187 }
Chris@8 188
Chris@8 189 string
Chris@8 190 CepstrumPitchTracker::getDescription() const
Chris@8 191 {
Chris@8 192 return "Estimate f0 of monophonic material using a cepstrum method.";
Chris@8 193 }
Chris@8 194
Chris@8 195 string
Chris@8 196 CepstrumPitchTracker::getMaker() const
Chris@8 197 {
Chris@8 198 return "Chris Cannam";
Chris@8 199 }
Chris@8 200
Chris@8 201 int
Chris@8 202 CepstrumPitchTracker::getPluginVersion() const
Chris@8 203 {
Chris@8 204 // Increment this each time you release a version that behaves
Chris@8 205 // differently from the previous one
Chris@8 206 return 1;
Chris@8 207 }
Chris@8 208
Chris@8 209 string
Chris@8 210 CepstrumPitchTracker::getCopyright() const
Chris@8 211 {
Chris@8 212 return "Freely redistributable (BSD license)";
Chris@8 213 }
Chris@8 214
Chris@8 215 CepstrumPitchTracker::InputDomain
Chris@8 216 CepstrumPitchTracker::getInputDomain() const
Chris@8 217 {
Chris@8 218 return FrequencyDomain;
Chris@8 219 }
Chris@8 220
Chris@8 221 size_t
Chris@8 222 CepstrumPitchTracker::getPreferredBlockSize() const
Chris@8 223 {
Chris@8 224 return 1024;
Chris@8 225 }
Chris@8 226
Chris@8 227 size_t
Chris@8 228 CepstrumPitchTracker::getPreferredStepSize() const
Chris@8 229 {
Chris@8 230 return 256;
Chris@8 231 }
Chris@8 232
Chris@8 233 size_t
Chris@8 234 CepstrumPitchTracker::getMinChannelCount() const
Chris@8 235 {
Chris@8 236 return 1;
Chris@8 237 }
Chris@8 238
Chris@8 239 size_t
Chris@8 240 CepstrumPitchTracker::getMaxChannelCount() const
Chris@8 241 {
Chris@8 242 return 1;
Chris@8 243 }
Chris@8 244
Chris@8 245 CepstrumPitchTracker::ParameterList
Chris@8 246 CepstrumPitchTracker::getParameterDescriptors() const
Chris@8 247 {
Chris@8 248 ParameterList list;
Chris@8 249 return list;
Chris@8 250 }
Chris@8 251
Chris@8 252 float
Chris@8 253 CepstrumPitchTracker::getParameter(string identifier) const
Chris@8 254 {
Chris@8 255 return 0.f;
Chris@8 256 }
Chris@8 257
Chris@8 258 void
Chris@8 259 CepstrumPitchTracker::setParameter(string identifier, float value)
Chris@8 260 {
Chris@8 261 }
Chris@8 262
Chris@8 263 CepstrumPitchTracker::ProgramList
Chris@8 264 CepstrumPitchTracker::getPrograms() const
Chris@8 265 {
Chris@8 266 ProgramList list;
Chris@8 267 return list;
Chris@8 268 }
Chris@8 269
Chris@8 270 string
Chris@8 271 CepstrumPitchTracker::getCurrentProgram() const
Chris@8 272 {
Chris@8 273 return ""; // no programs
Chris@8 274 }
Chris@8 275
Chris@8 276 void
Chris@8 277 CepstrumPitchTracker::selectProgram(string name)
Chris@8 278 {
Chris@8 279 }
Chris@8 280
Chris@8 281 CepstrumPitchTracker::OutputList
Chris@8 282 CepstrumPitchTracker::getOutputDescriptors() const
Chris@8 283 {
Chris@8 284 OutputList outputs;
Chris@8 285
Chris@8 286 int n = 0;
Chris@8 287
Chris@8 288 OutputDescriptor d;
Chris@8 289
Chris@8 290 d.identifier = "f0";
Chris@8 291 d.name = "Estimated f0";
Chris@8 292 d.description = "Estimated fundamental frequency";
Chris@8 293 d.unit = "Hz";
Chris@8 294 d.hasFixedBinCount = true;
Chris@8 295 d.binCount = 1;
Chris@8 296 d.hasKnownExtents = true;
Chris@8 297 d.minValue = m_fmin;
Chris@8 298 d.maxValue = m_fmax;
Chris@8 299 d.isQuantized = false;
Chris@8 300 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@8 301 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@8 302 d.hasDuration = false;
Chris@8 303 outputs.push_back(d);
Chris@8 304
Chris@8 305 return outputs;
Chris@8 306 }
Chris@8 307
Chris@8 308 bool
Chris@8 309 CepstrumPitchTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
Chris@8 310 {
Chris@8 311 if (channels < getMinChannelCount() ||
Chris@8 312 channels > getMaxChannelCount()) return false;
Chris@8 313
Chris@8 314 // std::cerr << "CepstrumPitchTracker::initialise: channels = " << channels
Chris@8 315 // << ", stepSize = " << stepSize << ", blockSize = " << blockSize
Chris@8 316 // << std::endl;
Chris@8 317
Chris@8 318 m_channels = channels;
Chris@8 319 m_stepSize = stepSize;
Chris@8 320 m_blockSize = blockSize;
Chris@8 321
Chris@8 322 m_binFrom = int(m_inputSampleRate / m_fmax);
Chris@8 323 m_binTo = int(m_inputSampleRate / m_fmin);
Chris@8 324
Chris@8 325 if (m_binTo >= (int)m_blockSize / 2) {
Chris@8 326 m_binTo = m_blockSize / 2 - 1;
Chris@8 327 }
Chris@8 328
Chris@8 329 m_bins = (m_binTo - m_binFrom) + 1;
Chris@8 330
Chris@8 331 m_history = new double *[m_histlen];
Chris@8 332 for (int i = 0; i < m_histlen; ++i) {
Chris@8 333 m_history[i] = new double[m_bins];
Chris@8 334 }
Chris@8 335
Chris@8 336 reset();
Chris@8 337
Chris@8 338 return true;
Chris@8 339 }
Chris@8 340
Chris@8 341 void
Chris@8 342 CepstrumPitchTracker::reset()
Chris@8 343 {
Chris@8 344 for (int i = 0; i < m_histlen; ++i) {
Chris@8 345 for (int j = 0; j < m_bins; ++j) {
Chris@8 346 m_history[i][j] = 0.0;
Chris@8 347 }
Chris@8 348 }
Chris@8 349 }
Chris@8 350
Chris@8 351 void
Chris@8 352 CepstrumPitchTracker::filter(const double *cep, double *result)
Chris@8 353 {
Chris@8 354 int hix = m_histlen - 1; // current history index
Chris@8 355
Chris@8 356 // roll back the history
Chris@8 357 if (m_histlen > 1) {
Chris@8 358 double *oldest = m_history[0];
Chris@8 359 for (int i = 1; i < m_histlen; ++i) {
Chris@8 360 m_history[i-1] = m_history[i];
Chris@8 361 }
Chris@8 362 // and stick this back in the newest spot, to recycle
Chris@8 363 m_history[hix] = oldest;
Chris@8 364 }
Chris@8 365
Chris@8 366 for (int i = 0; i < m_bins; ++i) {
Chris@10 367 double v = 0;
Chris@10 368 int n = 0;
Chris@10 369 // average according to the vertical filter length
Chris@10 370 for (int j = -m_vflen/2; j <= m_vflen/2; ++j) {
Chris@10 371 int ix = i + m_binFrom + j;
Chris@10 372 if (ix >= 0 && ix < m_blockSize) {
Chris@10 373 v += cep[ix];
Chris@10 374 ++n;
Chris@10 375 }
Chris@10 376 }
Chris@10 377 m_history[hix][i] = v / n;
Chris@8 378 }
Chris@8 379
Chris@8 380 for (int i = 0; i < m_bins; ++i) {
Chris@8 381 double mean = 0.0;
Chris@8 382 for (int j = 0; j < m_histlen; ++j) {
Chris@8 383 mean += m_history[j][i];
Chris@8 384 }
Chris@8 385 mean /= m_histlen;
Chris@8 386 result[i] = mean;
Chris@8 387 }
Chris@8 388 }
Chris@8 389
Chris@11 390 double
Chris@11 391 CepstrumPitchTracker::calculatePeakProportion(const double *data, double abstot, int n)
Chris@11 392 {
Chris@11 393 double aroundPeak = data[n];
Chris@11 394 double peakProportion = 0.0;
Chris@11 395
Chris@11 396 int i = n - 1;
Chris@11 397 while (i > 0 && data[i] <= data[i+1]) {
Chris@11 398 aroundPeak += fabs(data[i]);
Chris@11 399 --i;
Chris@11 400 }
Chris@11 401 i = n + 1;
Chris@11 402 while (i < m_bins && data[i] <= data[i-1]) {
Chris@11 403 aroundPeak += fabs(data[i]);
Chris@11 404 ++i;
Chris@11 405 }
Chris@11 406 peakProportion = aroundPeak / abstot;
Chris@11 407
Chris@11 408 return peakProportion;
Chris@11 409 }
Chris@11 410
Chris@11 411 bool
Chris@11 412 CepstrumPitchTracker::acceptPeak(int n, double peakProportion)
Chris@11 413 {
Chris@11 414 bool accept = false;
Chris@11 415
Chris@11 416 if (abs(n - m_prevpeak) < 10) { //!!! should depend on bin count
Chris@11 417 accept = true;
Chris@11 418 } else if (peakProportion > m_prevprop * 2) {
Chris@11 419 accept = true;
Chris@11 420 }
Chris@11 421
Chris@11 422 return accept;
Chris@11 423 }
Chris@11 424
Chris@8 425 CepstrumPitchTracker::FeatureSet
Chris@8 426 CepstrumPitchTracker::process(const float *const *inputBuffers, Vamp::RealTime timestamp)
Chris@8 427 {
Chris@8 428 FeatureSet fs;
Chris@8 429
Chris@8 430 int bs = m_blockSize;
Chris@8 431 int hs = m_blockSize/2 + 1;
Chris@8 432
Chris@8 433 double *rawcep = new double[bs];
Chris@8 434 double *io = new double[bs];
Chris@8 435 double *logmag = new double[bs];
Chris@8 436
Chris@9 437 // The "inverse symmetric" method. Seems to be the most reliable
Chris@8 438
Chris@8 439 for (int i = 0; i < hs; ++i) {
Chris@8 440
Chris@8 441 double power =
Chris@8 442 inputBuffers[0][i*2 ] * inputBuffers[0][i*2 ] +
Chris@8 443 inputBuffers[0][i*2+1] * inputBuffers[0][i*2+1];
Chris@8 444 double mag = sqrt(power);
Chris@8 445
Chris@8 446 double lm = log(mag + 0.00000001);
Chris@8 447
Chris@9 448 logmag[i] = lm;
Chris@9 449 if (i > 0) logmag[bs - i] = lm;
Chris@8 450 }
Chris@8 451
Chris@9 452 fft(bs, true, logmag, 0, rawcep, io);
Chris@8 453
Chris@8 454 delete[] logmag;
Chris@8 455 delete[] io;
Chris@8 456
Chris@8 457 int n = m_bins;
Chris@8 458 double *data = new double[n];
Chris@8 459 filter(rawcep, data);
Chris@8 460 delete[] rawcep;
Chris@8 461
Chris@11 462 double abstot = 0.0;
Chris@11 463
Chris@11 464 for (int i = 0; i < n; ++i) {
Chris@11 465 abstot += fabs(data[i]);
Chris@11 466 }
Chris@11 467
Chris@8 468 double maxval = 0.0;
Chris@11 469 int maxbin = -1;
Chris@8 470
Chris@8 471 for (int i = 0; i < n; ++i) {
Chris@8 472 if (data[i] > maxval) {
Chris@8 473 maxval = data[i];
Chris@8 474 maxbin = i;
Chris@8 475 }
Chris@8 476 }
Chris@8 477
Chris@13 478 if (maxbin < 0) return fs;
Chris@13 479
Chris@13 480 double peakfreq = m_inputSampleRate / (maxbin + m_binFrom);
Chris@13 481 Hypothesis::Estimate e;
Chris@13 482 e.freq = peakfreq;
Chris@13 483 e.time = timestamp;
Chris@13 484
Chris@13 485 m_accepted.advanceTime();
Chris@16 486
Chris@13 487 for (int i = 0; i < m_possible.size(); ++i) {
Chris@13 488 m_possible[i].advanceTime();
Chris@13 489 }
Chris@13 490
Chris@16 491 if (!m_accepted.test(e)) {
Chris@18 492
Chris@16 493 int candidate = -1;
Chris@18 494 bool accepted = false;
Chris@18 495
Chris@16 496 for (int i = 0; i < m_possible.size(); ++i) {
Chris@16 497 if (m_possible[i].test(e)) {
Chris@18 498 accepted = true;
Chris@16 499 if (m_possible[i].getState() == Hypothesis::Satisfied) {
Chris@16 500 candidate = i;
Chris@16 501 }
Chris@16 502 break;
Chris@16 503 }
Chris@16 504 }
Chris@17 505
Chris@18 506 if (!accepted) {
Chris@18 507 Hypothesis h;
Chris@18 508 h.test(e); //!!! must succeed as h is new, so perhaps there should be a ctor for this
Chris@18 509 m_possible.push_back(h);
Chris@18 510 }
Chris@18 511
Chris@16 512 if (m_accepted.getState() == Hypothesis::Expired) {
Chris@16 513 m_accepted.addFeatures(fs[0]);
Chris@17 514 }
Chris@17 515
Chris@17 516 if (m_accepted.getState() == Hypothesis::Expired ||
Chris@17 517 m_accepted.getState() == Hypothesis::Rejected) {
Chris@16 518 if (candidate >= 0) {
Chris@16 519 m_accepted = m_possible[candidate];
Chris@16 520 } else {
Chris@16 521 m_accepted = Hypothesis();
Chris@16 522 }
Chris@16 523 }
Chris@13 524
Chris@19 525 // reap rejected/expired hypotheses from possible list
Chris@19 526 Hypotheses toReap = m_possible;
Chris@19 527 m_possible.clear();
Chris@19 528 for (int i = 0; i < toReap.size(); ++i) {
Chris@19 529 Hypothesis h = toReap[i];
Chris@19 530 if (h.getState() != Hypothesis::Rejected &&
Chris@19 531 h.getState() != Hypothesis::Expired) {
Chris@19 532 m_possible.push_back(h);
Chris@19 533 }
Chris@19 534 }
Chris@19 535 }
Chris@19 536
Chris@17 537 std::cerr << "accepted length = " << m_accepted.getPendingLength()
Chris@17 538 << ", state = " << m_accepted.getState()
Chris@17 539 << ", hypothesis count = " << m_possible.size() << std::endl;
Chris@17 540
Chris@16 541
Chris@13 542
Chris@13 543 /*
Chris@11 544 bool accepted = false;
Chris@11 545
Chris@11 546 if (maxbin >= 0) {
Chris@11 547 double pp = calculatePeakProportion(data, abstot, maxbin);
Chris@11 548 if (acceptPeak(maxbin, pp)) {
Chris@11 549 accepted = true;
Chris@11 550 } else {
Chris@11 551 // try a secondary peak
Chris@11 552 maxval = 0.0;
Chris@11 553 int secondbin = 0;
Chris@11 554 for (int i = 1; i < n-1; ++i) {
Chris@11 555 if (i != maxbin &&
Chris@11 556 data[i] > data[i-1] &&
Chris@11 557 data[i] > data[i+1] &&
Chris@11 558 data[i] > maxval) {
Chris@11 559 maxval = data[i];
Chris@11 560 secondbin = i;
Chris@11 561 }
Chris@11 562 }
Chris@11 563 double spp = calculatePeakProportion(data, abstot, secondbin);
Chris@11 564 if (acceptPeak(secondbin, spp)) {
Chris@11 565 maxbin = secondbin;
Chris@11 566 pp = spp;
Chris@11 567 accepted = true;
Chris@11 568 }
Chris@8 569 }
Chris@11 570 if (accepted) {
Chris@11 571 m_prevpeak = maxbin;
Chris@11 572 m_prevprop = pp;
Chris@8 573 }
Chris@8 574 }
Chris@13 575 */
Chris@8 576 // std::cerr << "peakProportion = " << peakProportion << std::endl;
Chris@8 577 // std::cerr << "peak = " << m_inputSampleRate / (maxbin + m_binFrom) << std::endl;
Chris@9 578 // std::cerr << "bins = " << m_bins << std::endl;
Chris@8 579
Chris@11 580 // if (peakProportion >= (0.00006 * m_bins)) {
Chris@16 581 /*
Chris@11 582 if (accepted) {
Chris@8 583 Feature f;
Chris@8 584 f.hasTimestamp = true;
Chris@8 585 f.timestamp = timestamp;
Chris@8 586 f.values.push_back(m_inputSampleRate / (maxbin + m_binFrom));
Chris@8 587 fs[0].push_back(f);
Chris@8 588 }
Chris@16 589 */
Chris@8 590 delete[] data;
Chris@8 591 return fs;
Chris@8 592 }
Chris@8 593
Chris@8 594 CepstrumPitchTracker::FeatureSet
Chris@8 595 CepstrumPitchTracker::getRemainingFeatures()
Chris@8 596 {
Chris@8 597 FeatureSet fs;
Chris@16 598 if (m_accepted.getState() != Hypothesis::New) {
Chris@16 599 m_accepted.addFeatures(fs[0]);
Chris@16 600 }
Chris@8 601 return fs;
Chris@8 602 }
Chris@8 603
Chris@8 604 void
Chris@8 605 CepstrumPitchTracker::fft(unsigned int n, bool inverse,
Chris@8 606 double *ri, double *ii, double *ro, double *io)
Chris@8 607 {
Chris@8 608 if (!ri || !ro || !io) return;
Chris@8 609
Chris@8 610 unsigned int bits;
Chris@8 611 unsigned int i, j, k, m;
Chris@8 612 unsigned int blockSize, blockEnd;
Chris@8 613
Chris@8 614 double tr, ti;
Chris@8 615
Chris@8 616 if (n < 2) return;
Chris@8 617 if (n & (n-1)) return;
Chris@8 618
Chris@8 619 double angle = 2.0 * M_PI;
Chris@8 620 if (inverse) angle = -angle;
Chris@8 621
Chris@8 622 for (i = 0; ; ++i) {
Chris@8 623 if (n & (1 << i)) {
Chris@8 624 bits = i;
Chris@8 625 break;
Chris@8 626 }
Chris@8 627 }
Chris@8 628
Chris@8 629 static unsigned int tableSize = 0;
Chris@8 630 static int *table = 0;
Chris@8 631
Chris@8 632 if (tableSize != n) {
Chris@8 633
Chris@8 634 delete[] table;
Chris@8 635
Chris@8 636 table = new int[n];
Chris@8 637
Chris@8 638 for (i = 0; i < n; ++i) {
Chris@8 639
Chris@8 640 m = i;
Chris@8 641
Chris@8 642 for (j = k = 0; j < bits; ++j) {
Chris@8 643 k = (k << 1) | (m & 1);
Chris@8 644 m >>= 1;
Chris@8 645 }
Chris@8 646
Chris@8 647 table[i] = k;
Chris@8 648 }
Chris@8 649
Chris@8 650 tableSize = n;
Chris@8 651 }
Chris@8 652
Chris@8 653 if (ii) {
Chris@8 654 for (i = 0; i < n; ++i) {
Chris@8 655 ro[table[i]] = ri[i];
Chris@8 656 io[table[i]] = ii[i];
Chris@8 657 }
Chris@8 658 } else {
Chris@8 659 for (i = 0; i < n; ++i) {
Chris@8 660 ro[table[i]] = ri[i];
Chris@8 661 io[table[i]] = 0.0;
Chris@8 662 }
Chris@8 663 }
Chris@8 664
Chris@8 665 blockEnd = 1;
Chris@8 666
Chris@8 667 for (blockSize = 2; blockSize <= n; blockSize <<= 1) {
Chris@8 668
Chris@8 669 double delta = angle / (double)blockSize;
Chris@8 670 double sm2 = -sin(-2 * delta);
Chris@8 671 double sm1 = -sin(-delta);
Chris@8 672 double cm2 = cos(-2 * delta);
Chris@8 673 double cm1 = cos(-delta);
Chris@8 674 double w = 2 * cm1;
Chris@8 675 double ar[3], ai[3];
Chris@8 676
Chris@8 677 for (i = 0; i < n; i += blockSize) {
Chris@8 678
Chris@8 679 ar[2] = cm2;
Chris@8 680 ar[1] = cm1;
Chris@8 681
Chris@8 682 ai[2] = sm2;
Chris@8 683 ai[1] = sm1;
Chris@8 684
Chris@8 685 for (j = i, m = 0; m < blockEnd; j++, m++) {
Chris@8 686
Chris@8 687 ar[0] = w * ar[1] - ar[2];
Chris@8 688 ar[2] = ar[1];
Chris@8 689 ar[1] = ar[0];
Chris@8 690
Chris@8 691 ai[0] = w * ai[1] - ai[2];
Chris@8 692 ai[2] = ai[1];
Chris@8 693 ai[1] = ai[0];
Chris@8 694
Chris@8 695 k = j + blockEnd;
Chris@8 696 tr = ar[0] * ro[k] - ai[0] * io[k];
Chris@8 697 ti = ar[0] * io[k] + ai[0] * ro[k];
Chris@8 698
Chris@8 699 ro[k] = ro[j] - tr;
Chris@8 700 io[k] = io[j] - ti;
Chris@8 701
Chris@8 702 ro[j] += tr;
Chris@8 703 io[j] += ti;
Chris@8 704 }
Chris@8 705 }
Chris@8 706
Chris@8 707 blockEnd = blockSize;
Chris@8 708 }
Chris@8 709 }
Chris@8 710
Chris@8 711