annotate CepstrumPitchTracker.cpp @ 23:1ae8041ae31b

Merge from branch "track"
author Chris Cannam
date Thu, 05 Jul 2012 08:29:20 +0100
parents a949c0278d7d
children a15d8c89a36e
rev   line source
Chris@8 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@8 2 /*
Chris@8 3 Permission is hereby granted, free of charge, to any person
Chris@8 4 obtaining a copy of this software and associated documentation
Chris@8 5 files (the "Software"), to deal in the Software without
Chris@8 6 restriction, including without limitation the rights to use, copy,
Chris@8 7 modify, merge, publish, distribute, sublicense, and/or sell copies
Chris@8 8 of the Software, and to permit persons to whom the Software is
Chris@8 9 furnished to do so, subject to the following conditions:
Chris@8 10
Chris@8 11 The above copyright notice and this permission notice shall be
Chris@8 12 included in all copies or substantial portions of the Software.
Chris@8 13
Chris@8 14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
Chris@8 15 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
Chris@8 16 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
Chris@8 17 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
Chris@8 18 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
Chris@8 19 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
Chris@8 20 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Chris@8 21 */
Chris@8 22
Chris@8 23 #include "CepstrumPitchTracker.h"
Chris@8 24
Chris@8 25 #include <vector>
Chris@8 26 #include <algorithm>
Chris@8 27
Chris@8 28 #include <cstdio>
Chris@8 29 #include <cmath>
Chris@8 30 #include <complex>
Chris@8 31
Chris@8 32 using std::string;
Chris@12 33 using std::vector;
Chris@21 34 using Vamp::RealTime;
Chris@12 35
Chris@13 36 CepstrumPitchTracker::Hypothesis::Hypothesis()
Chris@12 37 {
Chris@13 38 m_state = New;
Chris@12 39 m_age = 0;
Chris@12 40 }
Chris@12 41
Chris@16 42 CepstrumPitchTracker::Hypothesis::~Hypothesis()
Chris@16 43 {
Chris@16 44 }
Chris@16 45
Chris@12 46 bool
Chris@12 47 CepstrumPitchTracker::Hypothesis::isWithinTolerance(Estimate s)
Chris@12 48 {
Chris@12 49 if (m_pending.empty()) {
Chris@12 50 return true;
Chris@12 51 }
Chris@21 52
Chris@21 53 // check we are within a relatively close tolerance of the last
Chris@21 54 // candidate
Chris@22 55 Estimate last = m_pending[m_pending.size()-1];
Chris@12 56 double r = s.freq / last.freq;
Chris@12 57 int cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@22 58 if (cents < -60 || cents > 60) return false;
Chris@21 59
Chris@22 60 // and within a slightly bigger tolerance of the current mean
Chris@22 61 double meanFreq = getMeanFrequency();
Chris@22 62 r = s.freq / meanFreq;
Chris@21 63 cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@21 64 if (cents < -80 || cents > 80) return false;
Chris@21 65
Chris@21 66 return true;
Chris@12 67 }
Chris@12 68
Chris@12 69 bool
Chris@12 70 CepstrumPitchTracker::Hypothesis::isSatisfied()
Chris@12 71 {
Chris@20 72 if (m_pending.empty()) return false;
Chris@20 73
Chris@20 74 double meanConfidence = 0.0;
Chris@20 75 for (int i = 0; i < m_pending.size(); ++i) {
Chris@20 76 meanConfidence += m_pending[i].confidence;
Chris@20 77 }
Chris@20 78 meanConfidence /= m_pending.size();
Chris@20 79
Chris@20 80 int lengthRequired = int(2.0 / meanConfidence + 0.5);
Chris@20 81 std::cerr << "meanConfidence = " << meanConfidence << ", lengthRequired = " << lengthRequired << ", length = " << m_pending.size() << std::endl;
Chris@20 82
Chris@20 83 return (m_pending.size() > lengthRequired);
Chris@12 84 }
Chris@12 85
Chris@13 86 void
Chris@13 87 CepstrumPitchTracker::Hypothesis::advanceTime()
Chris@13 88 {
Chris@13 89 ++m_age;
Chris@13 90 }
Chris@13 91
Chris@12 92 bool
Chris@12 93 CepstrumPitchTracker::Hypothesis::test(Estimate s)
Chris@12 94 {
Chris@13 95 bool accept = false;
Chris@13 96
Chris@13 97 switch (m_state) {
Chris@13 98
Chris@13 99 case New:
Chris@13 100 m_state = Provisional;
Chris@13 101 accept = true;
Chris@13 102 break;
Chris@13 103
Chris@13 104 case Provisional:
Chris@13 105 if (m_age > 3) {
Chris@13 106 m_state = Rejected;
Chris@13 107 } else if (isWithinTolerance(s)) {
Chris@13 108 accept = true;
Chris@13 109 }
Chris@13 110 break;
Chris@13 111
Chris@13 112 case Satisfied:
Chris@13 113 if (m_age > 3) {
Chris@13 114 m_state = Expired;
Chris@13 115 } else if (isWithinTolerance(s)) {
Chris@13 116 accept = true;
Chris@13 117 }
Chris@13 118 break;
Chris@13 119
Chris@13 120 case Rejected:
Chris@13 121 break;
Chris@13 122
Chris@13 123 case Expired:
Chris@13 124 break;
Chris@12 125 }
Chris@12 126
Chris@13 127 if (accept) {
Chris@13 128 m_pending.push_back(s);
Chris@13 129 m_age = 0;
Chris@13 130 if (m_state == Provisional && isSatisfied()) {
Chris@13 131 m_state = Satisfied;
Chris@12 132 }
Chris@12 133 }
Chris@12 134
Chris@19 135 return accept && (m_state == Satisfied);
Chris@13 136 }
Chris@12 137
Chris@12 138 CepstrumPitchTracker::Hypothesis::State
Chris@12 139 CepstrumPitchTracker::Hypothesis::getState()
Chris@12 140 {
Chris@12 141 return m_state;
Chris@12 142 }
Chris@12 143
Chris@17 144 int
Chris@17 145 CepstrumPitchTracker::Hypothesis::getPendingLength()
Chris@17 146 {
Chris@17 147 return m_pending.size();
Chris@17 148 }
Chris@17 149
Chris@12 150 CepstrumPitchTracker::Hypothesis::Estimates
Chris@12 151 CepstrumPitchTracker::Hypothesis::getAcceptedEstimates()
Chris@12 152 {
Chris@12 153 if (m_state == Satisfied || m_state == Expired) {
Chris@12 154 return m_pending;
Chris@12 155 } else {
Chris@12 156 return Estimates();
Chris@12 157 }
Chris@12 158 }
Chris@12 159
Chris@22 160 double
Chris@22 161 CepstrumPitchTracker::Hypothesis::getMeanFrequency()
Chris@22 162 {
Chris@22 163 double acc = 0.0;
Chris@22 164 for (int i = 0; i < m_pending.size(); ++i) {
Chris@22 165 acc += m_pending[i].freq;
Chris@22 166 }
Chris@22 167 acc /= m_pending.size();
Chris@22 168 return acc;
Chris@22 169 }
Chris@22 170
Chris@21 171 CepstrumPitchTracker::Hypothesis::Note
Chris@21 172 CepstrumPitchTracker::Hypothesis::getAveragedNote()
Chris@21 173 {
Chris@21 174 Note n;
Chris@21 175
Chris@21 176 if (!(m_state == Satisfied || m_state == Expired)) {
Chris@21 177 n.freq = 0.0;
Chris@21 178 n.time = RealTime::zeroTime;
Chris@21 179 n.duration = RealTime::zeroTime;
Chris@21 180 return n;
Chris@21 181 }
Chris@21 182
Chris@21 183 n.time = m_pending.begin()->time;
Chris@21 184
Chris@21 185 Estimates::iterator i = m_pending.end();
Chris@21 186 --i;
Chris@21 187 n.duration = i->time - n.time;
Chris@21 188
Chris@22 189 // just mean frequency for now, but this isn't at all right perceptually
Chris@22 190 n.freq = getMeanFrequency();
Chris@21 191
Chris@21 192 return n;
Chris@21 193 }
Chris@21 194
Chris@16 195 void
Chris@21 196 CepstrumPitchTracker::Hypothesis::addFeatures(FeatureSet &fs)
Chris@16 197 {
Chris@16 198 for (int i = 0; i < m_pending.size(); ++i) {
Chris@16 199 Feature f;
Chris@16 200 f.hasTimestamp = true;
Chris@16 201 f.timestamp = m_pending[i].time;
Chris@16 202 f.values.push_back(m_pending[i].freq);
Chris@21 203 fs[0].push_back(f);
Chris@16 204 }
Chris@21 205
Chris@21 206 Feature nf;
Chris@21 207 nf.hasTimestamp = true;
Chris@21 208 nf.hasDuration = true;
Chris@21 209 Note n = getAveragedNote();
Chris@21 210 nf.timestamp = n.time;
Chris@21 211 nf.duration = n.duration;
Chris@21 212 nf.values.push_back(n.freq);
Chris@21 213 fs[1].push_back(nf);
Chris@16 214 }
Chris@8 215
Chris@8 216 CepstrumPitchTracker::CepstrumPitchTracker(float inputSampleRate) :
Chris@8 217 Plugin(inputSampleRate),
Chris@8 218 m_channels(0),
Chris@8 219 m_stepSize(256),
Chris@8 220 m_blockSize(1024),
Chris@8 221 m_fmin(50),
Chris@8 222 m_fmax(1000),
Chris@10 223 m_vflen(3),
Chris@8 224 m_binFrom(0),
Chris@8 225 m_binTo(0),
Chris@20 226 m_bins(0)
Chris@8 227 {
Chris@8 228 }
Chris@8 229
Chris@8 230 CepstrumPitchTracker::~CepstrumPitchTracker()
Chris@8 231 {
Chris@8 232 }
Chris@8 233
Chris@8 234 string
Chris@8 235 CepstrumPitchTracker::getIdentifier() const
Chris@8 236 {
Chris@8 237 return "cepstrum-pitch";
Chris@8 238 }
Chris@8 239
Chris@8 240 string
Chris@8 241 CepstrumPitchTracker::getName() const
Chris@8 242 {
Chris@8 243 return "Cepstrum Pitch Tracker";
Chris@8 244 }
Chris@8 245
Chris@8 246 string
Chris@8 247 CepstrumPitchTracker::getDescription() const
Chris@8 248 {
Chris@8 249 return "Estimate f0 of monophonic material using a cepstrum method.";
Chris@8 250 }
Chris@8 251
Chris@8 252 string
Chris@8 253 CepstrumPitchTracker::getMaker() const
Chris@8 254 {
Chris@8 255 return "Chris Cannam";
Chris@8 256 }
Chris@8 257
Chris@8 258 int
Chris@8 259 CepstrumPitchTracker::getPluginVersion() const
Chris@8 260 {
Chris@8 261 // Increment this each time you release a version that behaves
Chris@8 262 // differently from the previous one
Chris@8 263 return 1;
Chris@8 264 }
Chris@8 265
Chris@8 266 string
Chris@8 267 CepstrumPitchTracker::getCopyright() const
Chris@8 268 {
Chris@8 269 return "Freely redistributable (BSD license)";
Chris@8 270 }
Chris@8 271
Chris@8 272 CepstrumPitchTracker::InputDomain
Chris@8 273 CepstrumPitchTracker::getInputDomain() const
Chris@8 274 {
Chris@8 275 return FrequencyDomain;
Chris@8 276 }
Chris@8 277
Chris@8 278 size_t
Chris@8 279 CepstrumPitchTracker::getPreferredBlockSize() const
Chris@8 280 {
Chris@8 281 return 1024;
Chris@8 282 }
Chris@8 283
Chris@8 284 size_t
Chris@8 285 CepstrumPitchTracker::getPreferredStepSize() const
Chris@8 286 {
Chris@8 287 return 256;
Chris@8 288 }
Chris@8 289
Chris@8 290 size_t
Chris@8 291 CepstrumPitchTracker::getMinChannelCount() const
Chris@8 292 {
Chris@8 293 return 1;
Chris@8 294 }
Chris@8 295
Chris@8 296 size_t
Chris@8 297 CepstrumPitchTracker::getMaxChannelCount() const
Chris@8 298 {
Chris@8 299 return 1;
Chris@8 300 }
Chris@8 301
Chris@8 302 CepstrumPitchTracker::ParameterList
Chris@8 303 CepstrumPitchTracker::getParameterDescriptors() const
Chris@8 304 {
Chris@8 305 ParameterList list;
Chris@8 306 return list;
Chris@8 307 }
Chris@8 308
Chris@8 309 float
Chris@8 310 CepstrumPitchTracker::getParameter(string identifier) const
Chris@8 311 {
Chris@8 312 return 0.f;
Chris@8 313 }
Chris@8 314
Chris@8 315 void
Chris@8 316 CepstrumPitchTracker::setParameter(string identifier, float value)
Chris@8 317 {
Chris@8 318 }
Chris@8 319
Chris@8 320 CepstrumPitchTracker::ProgramList
Chris@8 321 CepstrumPitchTracker::getPrograms() const
Chris@8 322 {
Chris@8 323 ProgramList list;
Chris@8 324 return list;
Chris@8 325 }
Chris@8 326
Chris@8 327 string
Chris@8 328 CepstrumPitchTracker::getCurrentProgram() const
Chris@8 329 {
Chris@8 330 return ""; // no programs
Chris@8 331 }
Chris@8 332
Chris@8 333 void
Chris@8 334 CepstrumPitchTracker::selectProgram(string name)
Chris@8 335 {
Chris@8 336 }
Chris@8 337
Chris@8 338 CepstrumPitchTracker::OutputList
Chris@8 339 CepstrumPitchTracker::getOutputDescriptors() const
Chris@8 340 {
Chris@8 341 OutputList outputs;
Chris@8 342
Chris@8 343 int n = 0;
Chris@8 344
Chris@8 345 OutputDescriptor d;
Chris@8 346
Chris@8 347 d.identifier = "f0";
Chris@8 348 d.name = "Estimated f0";
Chris@8 349 d.description = "Estimated fundamental frequency";
Chris@8 350 d.unit = "Hz";
Chris@8 351 d.hasFixedBinCount = true;
Chris@8 352 d.binCount = 1;
Chris@8 353 d.hasKnownExtents = true;
Chris@8 354 d.minValue = m_fmin;
Chris@8 355 d.maxValue = m_fmax;
Chris@8 356 d.isQuantized = false;
Chris@8 357 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@8 358 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@8 359 d.hasDuration = false;
Chris@8 360 outputs.push_back(d);
Chris@8 361
Chris@21 362 d.identifier = "notes";
Chris@21 363 d.name = "Notes";
Chris@21 364 d.description = "Derived fixed-pitch note frequencies";
Chris@21 365 d.unit = "Hz";
Chris@21 366 d.hasFixedBinCount = true;
Chris@21 367 d.binCount = 1;
Chris@21 368 d.hasKnownExtents = true;
Chris@21 369 d.minValue = m_fmin;
Chris@21 370 d.maxValue = m_fmax;
Chris@21 371 d.isQuantized = false;
Chris@21 372 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@21 373 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@21 374 d.hasDuration = true;
Chris@21 375 outputs.push_back(d);
Chris@21 376
Chris@8 377 return outputs;
Chris@8 378 }
Chris@8 379
Chris@8 380 bool
Chris@8 381 CepstrumPitchTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
Chris@8 382 {
Chris@8 383 if (channels < getMinChannelCount() ||
Chris@8 384 channels > getMaxChannelCount()) return false;
Chris@8 385
Chris@8 386 // std::cerr << "CepstrumPitchTracker::initialise: channels = " << channels
Chris@8 387 // << ", stepSize = " << stepSize << ", blockSize = " << blockSize
Chris@8 388 // << std::endl;
Chris@8 389
Chris@8 390 m_channels = channels;
Chris@8 391 m_stepSize = stepSize;
Chris@8 392 m_blockSize = blockSize;
Chris@8 393
Chris@8 394 m_binFrom = int(m_inputSampleRate / m_fmax);
Chris@8 395 m_binTo = int(m_inputSampleRate / m_fmin);
Chris@8 396
Chris@8 397 if (m_binTo >= (int)m_blockSize / 2) {
Chris@8 398 m_binTo = m_blockSize / 2 - 1;
Chris@8 399 }
Chris@8 400
Chris@8 401 m_bins = (m_binTo - m_binFrom) + 1;
Chris@8 402
Chris@8 403 reset();
Chris@8 404
Chris@8 405 return true;
Chris@8 406 }
Chris@8 407
Chris@8 408 void
Chris@8 409 CepstrumPitchTracker::reset()
Chris@8 410 {
Chris@8 411 }
Chris@8 412
Chris@8 413 void
Chris@20 414 CepstrumPitchTracker::filter(const double *cep, double *data)
Chris@8 415 {
Chris@8 416 for (int i = 0; i < m_bins; ++i) {
Chris@10 417 double v = 0;
Chris@10 418 int n = 0;
Chris@10 419 // average according to the vertical filter length
Chris@10 420 for (int j = -m_vflen/2; j <= m_vflen/2; ++j) {
Chris@10 421 int ix = i + m_binFrom + j;
Chris@10 422 if (ix >= 0 && ix < m_blockSize) {
Chris@10 423 v += cep[ix];
Chris@10 424 ++n;
Chris@10 425 }
Chris@10 426 }
Chris@20 427 data[i] = v / n;
Chris@8 428 }
Chris@11 429 }
Chris@11 430
Chris@8 431 CepstrumPitchTracker::FeatureSet
Chris@21 432 CepstrumPitchTracker::process(const float *const *inputBuffers, RealTime timestamp)
Chris@8 433 {
Chris@8 434 FeatureSet fs;
Chris@8 435
Chris@8 436 int bs = m_blockSize;
Chris@8 437 int hs = m_blockSize/2 + 1;
Chris@8 438
Chris@8 439 double *rawcep = new double[bs];
Chris@8 440 double *io = new double[bs];
Chris@8 441 double *logmag = new double[bs];
Chris@8 442
Chris@9 443 // The "inverse symmetric" method. Seems to be the most reliable
Chris@8 444
Chris@8 445 for (int i = 0; i < hs; ++i) {
Chris@8 446
Chris@8 447 double power =
Chris@8 448 inputBuffers[0][i*2 ] * inputBuffers[0][i*2 ] +
Chris@8 449 inputBuffers[0][i*2+1] * inputBuffers[0][i*2+1];
Chris@8 450 double mag = sqrt(power);
Chris@8 451
Chris@8 452 double lm = log(mag + 0.00000001);
Chris@8 453
Chris@9 454 logmag[i] = lm;
Chris@9 455 if (i > 0) logmag[bs - i] = lm;
Chris@8 456 }
Chris@8 457
Chris@9 458 fft(bs, true, logmag, 0, rawcep, io);
Chris@8 459
Chris@8 460 delete[] logmag;
Chris@8 461 delete[] io;
Chris@8 462
Chris@8 463 int n = m_bins;
Chris@8 464 double *data = new double[n];
Chris@8 465 filter(rawcep, data);
Chris@8 466 delete[] rawcep;
Chris@8 467
Chris@11 468 double abstot = 0.0;
Chris@11 469
Chris@11 470 for (int i = 0; i < n; ++i) {
Chris@11 471 abstot += fabs(data[i]);
Chris@11 472 }
Chris@11 473
Chris@8 474 double maxval = 0.0;
Chris@11 475 int maxbin = -1;
Chris@8 476
Chris@8 477 for (int i = 0; i < n; ++i) {
Chris@8 478 if (data[i] > maxval) {
Chris@8 479 maxval = data[i];
Chris@8 480 maxbin = i;
Chris@8 481 }
Chris@8 482 }
Chris@8 483
Chris@20 484 if (maxbin < 0) {
Chris@20 485 delete[] data;
Chris@20 486 return fs;
Chris@20 487 }
Chris@20 488
Chris@20 489 double nextPeakVal = 0.0;
Chris@20 490 for (int i = 1; i+1 < n; ++i) {
Chris@20 491 if (data[i] > data[i-1] &&
Chris@20 492 data[i] > data[i+1] &&
Chris@20 493 i != maxbin &&
Chris@20 494 data[i] > nextPeakVal) {
Chris@20 495 nextPeakVal = data[i];
Chris@20 496 }
Chris@20 497 }
Chris@13 498
Chris@13 499 double peakfreq = m_inputSampleRate / (maxbin + m_binFrom);
Chris@20 500
Chris@20 501 double confidence = 0.0;
Chris@20 502 if (nextPeakVal != 0.0) {
Chris@20 503 confidence = ((maxval / nextPeakVal) - 1.0) / 4.0;
Chris@20 504 if (confidence > 1.0) confidence = 1.0;
Chris@20 505 }
Chris@20 506
Chris@13 507 Hypothesis::Estimate e;
Chris@13 508 e.freq = peakfreq;
Chris@13 509 e.time = timestamp;
Chris@20 510 e.confidence = confidence;
Chris@13 511
Chris@13 512 m_accepted.advanceTime();
Chris@16 513
Chris@13 514 for (int i = 0; i < m_possible.size(); ++i) {
Chris@13 515 m_possible[i].advanceTime();
Chris@13 516 }
Chris@13 517
Chris@16 518 if (!m_accepted.test(e)) {
Chris@18 519
Chris@16 520 int candidate = -1;
Chris@18 521 bool accepted = false;
Chris@18 522
Chris@16 523 for (int i = 0; i < m_possible.size(); ++i) {
Chris@16 524 if (m_possible[i].test(e)) {
Chris@18 525 accepted = true;
Chris@16 526 if (m_possible[i].getState() == Hypothesis::Satisfied) {
Chris@16 527 candidate = i;
Chris@16 528 }
Chris@16 529 break;
Chris@16 530 }
Chris@16 531 }
Chris@17 532
Chris@18 533 if (!accepted) {
Chris@18 534 Hypothesis h;
Chris@18 535 h.test(e); //!!! must succeed as h is new, so perhaps there should be a ctor for this
Chris@18 536 m_possible.push_back(h);
Chris@18 537 }
Chris@18 538
Chris@16 539 if (m_accepted.getState() == Hypothesis::Expired) {
Chris@21 540 m_accepted.addFeatures(fs);
Chris@17 541 }
Chris@17 542
Chris@17 543 if (m_accepted.getState() == Hypothesis::Expired ||
Chris@17 544 m_accepted.getState() == Hypothesis::Rejected) {
Chris@16 545 if (candidate >= 0) {
Chris@16 546 m_accepted = m_possible[candidate];
Chris@16 547 } else {
Chris@16 548 m_accepted = Hypothesis();
Chris@16 549 }
Chris@16 550 }
Chris@13 551
Chris@19 552 // reap rejected/expired hypotheses from possible list
Chris@19 553 Hypotheses toReap = m_possible;
Chris@19 554 m_possible.clear();
Chris@19 555 for (int i = 0; i < toReap.size(); ++i) {
Chris@19 556 Hypothesis h = toReap[i];
Chris@19 557 if (h.getState() != Hypothesis::Rejected &&
Chris@19 558 h.getState() != Hypothesis::Expired) {
Chris@19 559 m_possible.push_back(h);
Chris@19 560 }
Chris@19 561 }
Chris@19 562 }
Chris@19 563
Chris@20 564 std::cerr << "accepted length = " << m_accepted.getPendingLength()
Chris@20 565 << ", state = " << m_accepted.getState()
Chris@20 566 << ", hypothesis count = " << m_possible.size() << std::endl;
Chris@17 567
Chris@8 568 delete[] data;
Chris@8 569 return fs;
Chris@8 570 }
Chris@8 571
Chris@8 572 CepstrumPitchTracker::FeatureSet
Chris@8 573 CepstrumPitchTracker::getRemainingFeatures()
Chris@8 574 {
Chris@8 575 FeatureSet fs;
Chris@20 576 if (m_accepted.getState() == Hypothesis::Satisfied) {
Chris@21 577 m_accepted.addFeatures(fs);
Chris@16 578 }
Chris@8 579 return fs;
Chris@8 580 }
Chris@8 581
Chris@8 582 void
Chris@8 583 CepstrumPitchTracker::fft(unsigned int n, bool inverse,
Chris@8 584 double *ri, double *ii, double *ro, double *io)
Chris@8 585 {
Chris@8 586 if (!ri || !ro || !io) return;
Chris@8 587
Chris@8 588 unsigned int bits;
Chris@8 589 unsigned int i, j, k, m;
Chris@8 590 unsigned int blockSize, blockEnd;
Chris@8 591
Chris@8 592 double tr, ti;
Chris@8 593
Chris@8 594 if (n < 2) return;
Chris@8 595 if (n & (n-1)) return;
Chris@8 596
Chris@8 597 double angle = 2.0 * M_PI;
Chris@8 598 if (inverse) angle = -angle;
Chris@8 599
Chris@8 600 for (i = 0; ; ++i) {
Chris@8 601 if (n & (1 << i)) {
Chris@8 602 bits = i;
Chris@8 603 break;
Chris@8 604 }
Chris@8 605 }
Chris@8 606
Chris@8 607 static unsigned int tableSize = 0;
Chris@8 608 static int *table = 0;
Chris@8 609
Chris@8 610 if (tableSize != n) {
Chris@8 611
Chris@8 612 delete[] table;
Chris@8 613
Chris@8 614 table = new int[n];
Chris@8 615
Chris@8 616 for (i = 0; i < n; ++i) {
Chris@8 617
Chris@8 618 m = i;
Chris@8 619
Chris@8 620 for (j = k = 0; j < bits; ++j) {
Chris@8 621 k = (k << 1) | (m & 1);
Chris@8 622 m >>= 1;
Chris@8 623 }
Chris@8 624
Chris@8 625 table[i] = k;
Chris@8 626 }
Chris@8 627
Chris@8 628 tableSize = n;
Chris@8 629 }
Chris@8 630
Chris@8 631 if (ii) {
Chris@8 632 for (i = 0; i < n; ++i) {
Chris@8 633 ro[table[i]] = ri[i];
Chris@8 634 io[table[i]] = ii[i];
Chris@8 635 }
Chris@8 636 } else {
Chris@8 637 for (i = 0; i < n; ++i) {
Chris@8 638 ro[table[i]] = ri[i];
Chris@8 639 io[table[i]] = 0.0;
Chris@8 640 }
Chris@8 641 }
Chris@8 642
Chris@8 643 blockEnd = 1;
Chris@8 644
Chris@8 645 for (blockSize = 2; blockSize <= n; blockSize <<= 1) {
Chris@8 646
Chris@8 647 double delta = angle / (double)blockSize;
Chris@8 648 double sm2 = -sin(-2 * delta);
Chris@8 649 double sm1 = -sin(-delta);
Chris@8 650 double cm2 = cos(-2 * delta);
Chris@8 651 double cm1 = cos(-delta);
Chris@8 652 double w = 2 * cm1;
Chris@8 653 double ar[3], ai[3];
Chris@8 654
Chris@8 655 for (i = 0; i < n; i += blockSize) {
Chris@8 656
Chris@8 657 ar[2] = cm2;
Chris@8 658 ar[1] = cm1;
Chris@8 659
Chris@8 660 ai[2] = sm2;
Chris@8 661 ai[1] = sm1;
Chris@8 662
Chris@8 663 for (j = i, m = 0; m < blockEnd; j++, m++) {
Chris@8 664
Chris@8 665 ar[0] = w * ar[1] - ar[2];
Chris@8 666 ar[2] = ar[1];
Chris@8 667 ar[1] = ar[0];
Chris@8 668
Chris@8 669 ai[0] = w * ai[1] - ai[2];
Chris@8 670 ai[2] = ai[1];
Chris@8 671 ai[1] = ai[0];
Chris@8 672
Chris@8 673 k = j + blockEnd;
Chris@8 674 tr = ar[0] * ro[k] - ai[0] * io[k];
Chris@8 675 ti = ar[0] * io[k] + ai[0] * ro[k];
Chris@8 676
Chris@8 677 ro[k] = ro[j] - tr;
Chris@8 678 io[k] = io[j] - ti;
Chris@8 679
Chris@8 680 ro[j] += tr;
Chris@8 681 io[j] += ti;
Chris@8 682 }
Chris@8 683 }
Chris@8 684
Chris@8 685 blockEnd = blockSize;
Chris@8 686 }
Chris@8 687 }
Chris@8 688
Chris@8 689