annotate CepstrumPitchTracker.cpp @ 23:0e67ed2777e9

Thread safety
author Chris Cannam
date Mon, 09 Jul 2012 22:32:14 +0100
parents 0a0e449a6069
children 0c45cca1e4fd
rev   line source
Chris@3 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@3 2 /*
Chris@3 3 Permission is hereby granted, free of charge, to any person
Chris@3 4 obtaining a copy of this software and associated documentation
Chris@3 5 files (the "Software"), to deal in the Software without
Chris@3 6 restriction, including without limitation the rights to use, copy,
Chris@3 7 modify, merge, publish, distribute, sublicense, and/or sell copies
Chris@3 8 of the Software, and to permit persons to whom the Software is
Chris@3 9 furnished to do so, subject to the following conditions:
Chris@3 10
Chris@3 11 The above copyright notice and this permission notice shall be
Chris@3 12 included in all copies or substantial portions of the Software.
Chris@3 13
Chris@3 14 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
Chris@3 15 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
Chris@3 16 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
Chris@3 17 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
Chris@3 18 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
Chris@3 19 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
Chris@3 20 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
Chris@3 21 */
Chris@3 22
#include "CepstrumPitchTracker.h"

#include <vector>
#include <algorithm>

#include <climits>
#include <cstdio>
#include <cmath>
#include <complex>
Chris@3 31
Chris@3 32 using std::string;
Chris@7 33 using std::vector;
Chris@16 34 using Vamp::RealTime;
Chris@7 35
Chris@8 36 CepstrumPitchTracker::Hypothesis::Hypothesis()
Chris@7 37 {
Chris@8 38 m_state = New;
Chris@7 39 m_age = 0;
Chris@7 40 }
Chris@7 41
Chris@11 42 CepstrumPitchTracker::Hypothesis::~Hypothesis()
Chris@11 43 {
Chris@11 44 }
Chris@11 45
Chris@7 46 bool
Chris@7 47 CepstrumPitchTracker::Hypothesis::isWithinTolerance(Estimate s)
Chris@7 48 {
Chris@7 49 if (m_pending.empty()) {
Chris@7 50 return true;
Chris@7 51 }
Chris@16 52
Chris@16 53 // check we are within a relatively close tolerance of the last
Chris@16 54 // candidate
Chris@17 55 Estimate last = m_pending[m_pending.size()-1];
Chris@7 56 double r = s.freq / last.freq;
Chris@7 57 int cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@17 58 if (cents < -60 || cents > 60) return false;
Chris@16 59
Chris@17 60 // and within a slightly bigger tolerance of the current mean
Chris@17 61 double meanFreq = getMeanFrequency();
Chris@17 62 r = s.freq / meanFreq;
Chris@16 63 cents = lrint(1200.0 * (log(r) / log(2.0)));
Chris@16 64 if (cents < -80 || cents > 80) return false;
Chris@16 65
Chris@16 66 return true;
Chris@7 67 }
Chris@7 68
Chris@7 69 bool
Chris@7 70 CepstrumPitchTracker::Hypothesis::isSatisfied()
Chris@7 71 {
Chris@15 72 if (m_pending.empty()) return false;
Chris@15 73
Chris@15 74 double meanConfidence = 0.0;
Chris@15 75 for (int i = 0; i < m_pending.size(); ++i) {
Chris@15 76 meanConfidence += m_pending[i].confidence;
Chris@15 77 }
Chris@15 78 meanConfidence /= m_pending.size();
Chris@15 79
Chris@15 80 int lengthRequired = int(2.0 / meanConfidence + 0.5);
Chris@15 81 std::cerr << "meanConfidence = " << meanConfidence << ", lengthRequired = " << lengthRequired << ", length = " << m_pending.size() << std::endl;
Chris@15 82
Chris@15 83 return (m_pending.size() > lengthRequired);
Chris@7 84 }
Chris@7 85
Chris@8 86 void
Chris@8 87 CepstrumPitchTracker::Hypothesis::advanceTime()
Chris@8 88 {
Chris@8 89 ++m_age;
Chris@8 90 }
Chris@8 91
Chris@7 92 bool
Chris@7 93 CepstrumPitchTracker::Hypothesis::test(Estimate s)
Chris@7 94 {
Chris@8 95 bool accept = false;
Chris@8 96
Chris@8 97 switch (m_state) {
Chris@8 98
Chris@8 99 case New:
Chris@8 100 m_state = Provisional;
Chris@8 101 accept = true;
Chris@8 102 break;
Chris@8 103
Chris@8 104 case Provisional:
Chris@8 105 if (m_age > 3) {
Chris@8 106 m_state = Rejected;
Chris@8 107 } else if (isWithinTolerance(s)) {
Chris@8 108 accept = true;
Chris@8 109 }
Chris@8 110 break;
Chris@8 111
Chris@8 112 case Satisfied:
Chris@8 113 if (m_age > 3) {
Chris@8 114 m_state = Expired;
Chris@8 115 } else if (isWithinTolerance(s)) {
Chris@8 116 accept = true;
Chris@8 117 }
Chris@8 118 break;
Chris@8 119
Chris@8 120 case Rejected:
Chris@8 121 break;
Chris@8 122
Chris@8 123 case Expired:
Chris@8 124 break;
Chris@7 125 }
Chris@7 126
Chris@8 127 if (accept) {
Chris@8 128 m_pending.push_back(s);
Chris@8 129 m_age = 0;
Chris@8 130 if (m_state == Provisional && isSatisfied()) {
Chris@8 131 m_state = Satisfied;
Chris@7 132 }
Chris@7 133 }
Chris@7 134
Chris@14 135 return accept && (m_state == Satisfied);
Chris@8 136 }
Chris@7 137
Chris@7 138 CepstrumPitchTracker::Hypothesis::State
Chris@7 139 CepstrumPitchTracker::Hypothesis::getState()
Chris@7 140 {
Chris@7 141 return m_state;
Chris@7 142 }
Chris@7 143
Chris@12 144 int
Chris@12 145 CepstrumPitchTracker::Hypothesis::getPendingLength()
Chris@12 146 {
Chris@12 147 return m_pending.size();
Chris@12 148 }
Chris@12 149
Chris@7 150 CepstrumPitchTracker::Hypothesis::Estimates
Chris@7 151 CepstrumPitchTracker::Hypothesis::getAcceptedEstimates()
Chris@7 152 {
Chris@7 153 if (m_state == Satisfied || m_state == Expired) {
Chris@7 154 return m_pending;
Chris@7 155 } else {
Chris@7 156 return Estimates();
Chris@7 157 }
Chris@7 158 }
Chris@7 159
Chris@17 160 double
Chris@17 161 CepstrumPitchTracker::Hypothesis::getMeanFrequency()
Chris@17 162 {
Chris@17 163 double acc = 0.0;
Chris@17 164 for (int i = 0; i < m_pending.size(); ++i) {
Chris@17 165 acc += m_pending[i].freq;
Chris@17 166 }
Chris@17 167 acc /= m_pending.size();
Chris@17 168 return acc;
Chris@17 169 }
Chris@17 170
Chris@16 171 CepstrumPitchTracker::Hypothesis::Note
Chris@16 172 CepstrumPitchTracker::Hypothesis::getAveragedNote()
Chris@16 173 {
Chris@16 174 Note n;
Chris@16 175
Chris@16 176 if (!(m_state == Satisfied || m_state == Expired)) {
Chris@16 177 n.freq = 0.0;
Chris@16 178 n.time = RealTime::zeroTime;
Chris@16 179 n.duration = RealTime::zeroTime;
Chris@16 180 return n;
Chris@16 181 }
Chris@16 182
Chris@16 183 n.time = m_pending.begin()->time;
Chris@16 184
Chris@16 185 Estimates::iterator i = m_pending.end();
Chris@16 186 --i;
Chris@16 187 n.duration = i->time - n.time;
Chris@16 188
Chris@17 189 // just mean frequency for now, but this isn't at all right perceptually
Chris@17 190 n.freq = getMeanFrequency();
Chris@16 191
Chris@16 192 return n;
Chris@16 193 }
Chris@16 194
Chris@11 195 void
Chris@16 196 CepstrumPitchTracker::Hypothesis::addFeatures(FeatureSet &fs)
Chris@11 197 {
Chris@11 198 for (int i = 0; i < m_pending.size(); ++i) {
Chris@11 199 Feature f;
Chris@11 200 f.hasTimestamp = true;
Chris@11 201 f.timestamp = m_pending[i].time;
Chris@11 202 f.values.push_back(m_pending[i].freq);
Chris@16 203 fs[0].push_back(f);
Chris@11 204 }
Chris@16 205
Chris@16 206 Feature nf;
Chris@16 207 nf.hasTimestamp = true;
Chris@16 208 nf.hasDuration = true;
Chris@16 209 Note n = getAveragedNote();
Chris@16 210 nf.timestamp = n.time;
Chris@16 211 nf.duration = n.duration;
Chris@16 212 nf.values.push_back(n.freq);
Chris@16 213 fs[1].push_back(nf);
Chris@11 214 }
Chris@3 215
Chris@3 216 CepstrumPitchTracker::CepstrumPitchTracker(float inputSampleRate) :
Chris@3 217 Plugin(inputSampleRate),
Chris@3 218 m_channels(0),
Chris@3 219 m_stepSize(256),
Chris@3 220 m_blockSize(1024),
Chris@3 221 m_fmin(50),
Chris@3 222 m_fmax(1000),
Chris@18 223 m_vflen(1),
Chris@3 224 m_binFrom(0),
Chris@3 225 m_binTo(0),
Chris@15 226 m_bins(0)
Chris@3 227 {
Chris@3 228 }
Chris@3 229
Chris@3 230 CepstrumPitchTracker::~CepstrumPitchTracker()
Chris@3 231 {
Chris@3 232 }
Chris@3 233
Chris@3 234 string
Chris@3 235 CepstrumPitchTracker::getIdentifier() const
Chris@3 236 {
Chris@3 237 return "cepstrum-pitch";
Chris@3 238 }
Chris@3 239
Chris@3 240 string
Chris@3 241 CepstrumPitchTracker::getName() const
Chris@3 242 {
Chris@3 243 return "Cepstrum Pitch Tracker";
Chris@3 244 }
Chris@3 245
Chris@3 246 string
Chris@3 247 CepstrumPitchTracker::getDescription() const
Chris@3 248 {
Chris@3 249 return "Estimate f0 of monophonic material using a cepstrum method.";
Chris@3 250 }
Chris@3 251
Chris@3 252 string
Chris@3 253 CepstrumPitchTracker::getMaker() const
Chris@3 254 {
Chris@3 255 return "Chris Cannam";
Chris@3 256 }
Chris@3 257
Chris@3 258 int
Chris@3 259 CepstrumPitchTracker::getPluginVersion() const
Chris@3 260 {
Chris@3 261 // Increment this each time you release a version that behaves
Chris@3 262 // differently from the previous one
Chris@3 263 return 1;
Chris@3 264 }
Chris@3 265
Chris@3 266 string
Chris@3 267 CepstrumPitchTracker::getCopyright() const
Chris@3 268 {
Chris@3 269 return "Freely redistributable (BSD license)";
Chris@3 270 }
Chris@3 271
Chris@3 272 CepstrumPitchTracker::InputDomain
Chris@3 273 CepstrumPitchTracker::getInputDomain() const
Chris@3 274 {
Chris@3 275 return FrequencyDomain;
Chris@3 276 }
Chris@3 277
Chris@3 278 size_t
Chris@3 279 CepstrumPitchTracker::getPreferredBlockSize() const
Chris@3 280 {
Chris@3 281 return 1024;
Chris@3 282 }
Chris@3 283
Chris@3 284 size_t
Chris@3 285 CepstrumPitchTracker::getPreferredStepSize() const
Chris@3 286 {
Chris@3 287 return 256;
Chris@3 288 }
Chris@3 289
Chris@3 290 size_t
Chris@3 291 CepstrumPitchTracker::getMinChannelCount() const
Chris@3 292 {
Chris@3 293 return 1;
Chris@3 294 }
Chris@3 295
Chris@3 296 size_t
Chris@3 297 CepstrumPitchTracker::getMaxChannelCount() const
Chris@3 298 {
Chris@3 299 return 1;
Chris@3 300 }
Chris@3 301
Chris@3 302 CepstrumPitchTracker::ParameterList
Chris@3 303 CepstrumPitchTracker::getParameterDescriptors() const
Chris@3 304 {
Chris@3 305 ParameterList list;
Chris@3 306 return list;
Chris@3 307 }
Chris@3 308
Chris@3 309 float
Chris@3 310 CepstrumPitchTracker::getParameter(string identifier) const
Chris@3 311 {
Chris@3 312 return 0.f;
Chris@3 313 }
Chris@3 314
Chris@3 315 void
Chris@3 316 CepstrumPitchTracker::setParameter(string identifier, float value)
Chris@3 317 {
Chris@3 318 }
Chris@3 319
Chris@3 320 CepstrumPitchTracker::ProgramList
Chris@3 321 CepstrumPitchTracker::getPrograms() const
Chris@3 322 {
Chris@3 323 ProgramList list;
Chris@3 324 return list;
Chris@3 325 }
Chris@3 326
Chris@3 327 string
Chris@3 328 CepstrumPitchTracker::getCurrentProgram() const
Chris@3 329 {
Chris@3 330 return ""; // no programs
Chris@3 331 }
Chris@3 332
Chris@3 333 void
Chris@3 334 CepstrumPitchTracker::selectProgram(string name)
Chris@3 335 {
Chris@3 336 }
Chris@3 337
Chris@3 338 CepstrumPitchTracker::OutputList
Chris@3 339 CepstrumPitchTracker::getOutputDescriptors() const
Chris@3 340 {
Chris@3 341 OutputList outputs;
Chris@3 342
Chris@3 343 int n = 0;
Chris@3 344
Chris@3 345 OutputDescriptor d;
Chris@3 346
Chris@3 347 d.identifier = "f0";
Chris@3 348 d.name = "Estimated f0";
Chris@3 349 d.description = "Estimated fundamental frequency";
Chris@3 350 d.unit = "Hz";
Chris@3 351 d.hasFixedBinCount = true;
Chris@3 352 d.binCount = 1;
Chris@3 353 d.hasKnownExtents = true;
Chris@3 354 d.minValue = m_fmin;
Chris@3 355 d.maxValue = m_fmax;
Chris@3 356 d.isQuantized = false;
Chris@3 357 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@3 358 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@3 359 d.hasDuration = false;
Chris@3 360 outputs.push_back(d);
Chris@3 361
Chris@16 362 d.identifier = "notes";
Chris@16 363 d.name = "Notes";
Chris@16 364 d.description = "Derived fixed-pitch note frequencies";
Chris@16 365 d.unit = "Hz";
Chris@16 366 d.hasFixedBinCount = true;
Chris@16 367 d.binCount = 1;
Chris@16 368 d.hasKnownExtents = true;
Chris@16 369 d.minValue = m_fmin;
Chris@16 370 d.maxValue = m_fmax;
Chris@16 371 d.isQuantized = false;
Chris@16 372 d.sampleType = OutputDescriptor::FixedSampleRate;
Chris@16 373 d.sampleRate = (m_inputSampleRate / m_stepSize);
Chris@16 374 d.hasDuration = true;
Chris@16 375 outputs.push_back(d);
Chris@16 376
Chris@3 377 return outputs;
Chris@3 378 }
Chris@3 379
Chris@3 380 bool
Chris@3 381 CepstrumPitchTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
Chris@3 382 {
Chris@3 383 if (channels < getMinChannelCount() ||
Chris@3 384 channels > getMaxChannelCount()) return false;
Chris@3 385
Chris@3 386 // std::cerr << "CepstrumPitchTracker::initialise: channels = " << channels
Chris@3 387 // << ", stepSize = " << stepSize << ", blockSize = " << blockSize
Chris@3 388 // << std::endl;
Chris@3 389
Chris@3 390 m_channels = channels;
Chris@3 391 m_stepSize = stepSize;
Chris@3 392 m_blockSize = blockSize;
Chris@3 393
Chris@3 394 m_binFrom = int(m_inputSampleRate / m_fmax);
Chris@3 395 m_binTo = int(m_inputSampleRate / m_fmin);
Chris@3 396
Chris@3 397 if (m_binTo >= (int)m_blockSize / 2) {
Chris@3 398 m_binTo = m_blockSize / 2 - 1;
Chris@3 399 }
Chris@3 400
Chris@3 401 m_bins = (m_binTo - m_binFrom) + 1;
Chris@3 402
Chris@3 403 reset();
Chris@3 404
Chris@3 405 return true;
Chris@3 406 }
Chris@3 407
Chris@3 408 void
Chris@3 409 CepstrumPitchTracker::reset()
Chris@3 410 {
Chris@3 411 }
Chris@3 412
Chris@3 413 void
Chris@15 414 CepstrumPitchTracker::filter(const double *cep, double *data)
Chris@3 415 {
Chris@3 416 for (int i = 0; i < m_bins; ++i) {
Chris@5 417 double v = 0;
Chris@5 418 int n = 0;
Chris@5 419 // average according to the vertical filter length
Chris@5 420 for (int j = -m_vflen/2; j <= m_vflen/2; ++j) {
Chris@5 421 int ix = i + m_binFrom + j;
Chris@5 422 if (ix >= 0 && ix < m_blockSize) {
Chris@5 423 v += cep[ix];
Chris@5 424 ++n;
Chris@5 425 }
Chris@5 426 }
Chris@15 427 data[i] = v / n;
Chris@3 428 }
Chris@6 429 }
Chris@6 430
Chris@18 431 double
Chris@18 432 CepstrumPitchTracker::cubicInterpolate(const double y[4], double x)
Chris@18 433 {
Chris@18 434 double a0 = y[3] - y[2] - y[0] + y[1];
Chris@18 435 double a1 = y[0] - y[1] - a0;
Chris@18 436 double a2 = y[2] - y[0];
Chris@18 437 double a3 = y[1];
Chris@18 438 return
Chris@18 439 a0 * x * x * x +
Chris@18 440 a1 * x * x +
Chris@18 441 a2 * x +
Chris@18 442 a3;
Chris@18 443 }
Chris@18 444
Chris@18 445 double
Chris@18 446 CepstrumPitchTracker::findInterpolatedPeak(const double *in, int maxbin)
Chris@18 447 {
Chris@18 448 if (maxbin < 2 || maxbin > m_bins - 3) {
Chris@18 449 return maxbin;
Chris@18 450 }
Chris@18 451
Chris@18 452 double maxval = 0.0;
Chris@18 453 double maxidx = maxbin;
Chris@18 454
Chris@18 455 const int divisions = 10;
Chris@18 456 double y[4];
Chris@18 457
Chris@18 458 y[0] = in[maxbin-1];
Chris@18 459 y[1] = in[maxbin];
Chris@18 460 y[2] = in[maxbin+1];
Chris@18 461 y[3] = in[maxbin+2];
Chris@18 462 for (int i = 0; i < divisions; ++i) {
Chris@18 463 double probe = double(i) / double(divisions);
Chris@18 464 double value = cubicInterpolate(y, probe);
Chris@18 465 if (value > maxval) {
Chris@18 466 maxval = value;
Chris@18 467 maxidx = maxbin + probe;
Chris@18 468 }
Chris@18 469 }
Chris@18 470
Chris@18 471 y[3] = y[2];
Chris@18 472 y[2] = y[1];
Chris@18 473 y[1] = y[0];
Chris@18 474 y[0] = in[maxbin-2];
Chris@18 475 for (int i = 0; i < divisions; ++i) {
Chris@18 476 double probe = double(i) / double(divisions);
Chris@18 477 double value = cubicInterpolate(y, probe);
Chris@18 478 if (value > maxval) {
Chris@18 479 maxval = value;
Chris@18 480 maxidx = maxbin - 1 + probe;
Chris@18 481 }
Chris@18 482 }
Chris@18 483
Chris@18 484 /*
Chris@18 485 std::cerr << "centre = " << maxbin << ": ["
Chris@18 486 << in[maxbin-2] << ","
Chris@18 487 << in[maxbin-1] << ","
Chris@18 488 << in[maxbin] << ","
Chris@18 489 << in[maxbin+1] << ","
Chris@18 490 << in[maxbin+2] << "] -> " << maxidx << std::endl;
Chris@18 491 */
Chris@18 492
Chris@18 493 return maxidx;
Chris@18 494 }
Chris@18 495
Chris@3 496 CepstrumPitchTracker::FeatureSet
Chris@16 497 CepstrumPitchTracker::process(const float *const *inputBuffers, RealTime timestamp)
Chris@3 498 {
Chris@3 499 FeatureSet fs;
Chris@3 500
Chris@3 501 int bs = m_blockSize;
Chris@3 502 int hs = m_blockSize/2 + 1;
Chris@3 503
Chris@3 504 double *rawcep = new double[bs];
Chris@3 505 double *io = new double[bs];
Chris@3 506 double *logmag = new double[bs];
Chris@3 507
Chris@4 508 // The "inverse symmetric" method. Seems to be the most reliable
Chris@3 509
Chris@3 510 for (int i = 0; i < hs; ++i) {
Chris@3 511
Chris@3 512 double power =
Chris@3 513 inputBuffers[0][i*2 ] * inputBuffers[0][i*2 ] +
Chris@3 514 inputBuffers[0][i*2+1] * inputBuffers[0][i*2+1];
Chris@3 515 double mag = sqrt(power);
Chris@3 516
Chris@3 517 double lm = log(mag + 0.00000001);
Chris@3 518
Chris@4 519 logmag[i] = lm;
Chris@4 520 if (i > 0) logmag[bs - i] = lm;
Chris@3 521 }
Chris@3 522
Chris@4 523 fft(bs, true, logmag, 0, rawcep, io);
Chris@3 524
Chris@3 525 delete[] logmag;
Chris@3 526 delete[] io;
Chris@3 527
Chris@22 528 double cep1 = rawcep[1];
Chris@22 529
Chris@3 530 int n = m_bins;
Chris@3 531 double *data = new double[n];
Chris@3 532 filter(rawcep, data);
Chris@3 533 delete[] rawcep;
Chris@3 534
Chris@3 535 double maxval = 0.0;
Chris@6 536 int maxbin = -1;
Chris@3 537
Chris@3 538 for (int i = 0; i < n; ++i) {
Chris@3 539 if (data[i] > maxval) {
Chris@3 540 maxval = data[i];
Chris@3 541 maxbin = i;
Chris@3 542 }
Chris@3 543 }
Chris@3 544
Chris@15 545 if (maxbin < 0) {
Chris@15 546 delete[] data;
Chris@15 547 return fs;
Chris@15 548 }
Chris@15 549
Chris@15 550 double nextPeakVal = 0.0;
Chris@15 551 for (int i = 1; i+1 < n; ++i) {
Chris@15 552 if (data[i] > data[i-1] &&
Chris@15 553 data[i] > data[i+1] &&
Chris@15 554 i != maxbin &&
Chris@15 555 data[i] > nextPeakVal) {
Chris@15 556 nextPeakVal = data[i];
Chris@15 557 }
Chris@15 558 }
Chris@8 559
Chris@18 560 double cimax = findInterpolatedPeak(data, maxbin);
Chris@18 561 double peakfreq = m_inputSampleRate / (cimax + m_binFrom);
Chris@15 562
Chris@15 563 double confidence = 0.0;
Chris@15 564 if (nextPeakVal != 0.0) {
Chris@22 565 std::cerr << "maxval = " << maxval << ", cep1 = " << cep1 << std::endl;
Chris@22 566 double conf0 = (maxval - nextPeakVal) / 80.0;
Chris@22 567 double conf1 = (cep1 / bs) / 2;
Chris@22 568 if (conf0 > 1.0) conf0 = 1.0;
Chris@22 569 if (conf1 > 1.0) conf1 = 1.0;
Chris@22 570 confidence = conf0 * conf1;
Chris@22 571 std::cerr << "conf0 = " << conf0 << ", conf1 = " << conf1 << ", confidence = " << confidence << std::endl;
Chris@15 572 }
Chris@15 573
Chris@8 574 Hypothesis::Estimate e;
Chris@8 575 e.freq = peakfreq;
Chris@8 576 e.time = timestamp;
Chris@15 577 e.confidence = confidence;
Chris@8 578
Chris@8 579 m_accepted.advanceTime();
Chris@11 580
Chris@8 581 for (int i = 0; i < m_possible.size(); ++i) {
Chris@8 582 m_possible[i].advanceTime();
Chris@8 583 }
Chris@8 584
Chris@11 585 if (!m_accepted.test(e)) {
Chris@13 586
Chris@11 587 int candidate = -1;
Chris@13 588 bool accepted = false;
Chris@13 589
Chris@11 590 for (int i = 0; i < m_possible.size(); ++i) {
Chris@11 591 if (m_possible[i].test(e)) {
Chris@13 592 accepted = true;
Chris@11 593 if (m_possible[i].getState() == Hypothesis::Satisfied) {
Chris@11 594 candidate = i;
Chris@11 595 }
Chris@11 596 break;
Chris@11 597 }
Chris@11 598 }
Chris@12 599
Chris@13 600 if (!accepted) {
Chris@13 601 Hypothesis h;
Chris@13 602 h.test(e); //!!! must succeed as h is new, so perhaps there should be a ctor for this
Chris@13 603 m_possible.push_back(h);
Chris@13 604 }
Chris@13 605
Chris@11 606 if (m_accepted.getState() == Hypothesis::Expired) {
Chris@16 607 m_accepted.addFeatures(fs);
Chris@12 608 }
Chris@12 609
Chris@12 610 if (m_accepted.getState() == Hypothesis::Expired ||
Chris@12 611 m_accepted.getState() == Hypothesis::Rejected) {
Chris@11 612 if (candidate >= 0) {
Chris@11 613 m_accepted = m_possible[candidate];
Chris@11 614 } else {
Chris@11 615 m_accepted = Hypothesis();
Chris@11 616 }
Chris@11 617 }
Chris@8 618
Chris@14 619 // reap rejected/expired hypotheses from possible list
Chris@14 620 Hypotheses toReap = m_possible;
Chris@14 621 m_possible.clear();
Chris@14 622 for (int i = 0; i < toReap.size(); ++i) {
Chris@14 623 Hypothesis h = toReap[i];
Chris@14 624 if (h.getState() != Hypothesis::Rejected &&
Chris@14 625 h.getState() != Hypothesis::Expired) {
Chris@14 626 m_possible.push_back(h);
Chris@14 627 }
Chris@14 628 }
Chris@14 629 }
Chris@14 630
Chris@15 631 std::cerr << "accepted length = " << m_accepted.getPendingLength()
Chris@15 632 << ", state = " << m_accepted.getState()
Chris@15 633 << ", hypothesis count = " << m_possible.size() << std::endl;
Chris@12 634
Chris@3 635 delete[] data;
Chris@3 636 return fs;
Chris@3 637 }
Chris@3 638
Chris@3 639 CepstrumPitchTracker::FeatureSet
Chris@3 640 CepstrumPitchTracker::getRemainingFeatures()
Chris@3 641 {
Chris@3 642 FeatureSet fs;
Chris@15 643 if (m_accepted.getState() == Hypothesis::Satisfied) {
Chris@16 644 m_accepted.addFeatures(fs);
Chris@11 645 }
Chris@3 646 return fs;
Chris@3 647 }
Chris@3 648
Chris@3 649 void
Chris@3 650 CepstrumPitchTracker::fft(unsigned int n, bool inverse,
Chris@3 651 double *ri, double *ii, double *ro, double *io)
Chris@3 652 {
Chris@3 653 if (!ri || !ro || !io) return;
Chris@3 654
Chris@3 655 unsigned int bits;
Chris@3 656 unsigned int i, j, k, m;
Chris@3 657 unsigned int blockSize, blockEnd;
Chris@3 658
Chris@3 659 double tr, ti;
Chris@3 660
Chris@3 661 if (n < 2) return;
Chris@3 662 if (n & (n-1)) return;
Chris@3 663
Chris@3 664 double angle = 2.0 * M_PI;
Chris@3 665 if (inverse) angle = -angle;
Chris@3 666
Chris@3 667 for (i = 0; ; ++i) {
Chris@3 668 if (n & (1 << i)) {
Chris@3 669 bits = i;
Chris@3 670 break;
Chris@3 671 }
Chris@3 672 }
Chris@3 673
Chris@23 674 int *table = new int[n];
Chris@3 675
Chris@23 676 for (i = 0; i < n; ++i) {
Chris@23 677
Chris@23 678 m = i;
Chris@3 679
Chris@23 680 for (j = k = 0; j < bits; ++j) {
Chris@23 681 k = (k << 1) | (m & 1);
Chris@23 682 m >>= 1;
Chris@23 683 }
Chris@3 684
Chris@23 685 table[i] = k;
Chris@3 686 }
Chris@3 687
Chris@3 688 if (ii) {
Chris@3 689 for (i = 0; i < n; ++i) {
Chris@3 690 ro[table[i]] = ri[i];
Chris@3 691 io[table[i]] = ii[i];
Chris@3 692 }
Chris@3 693 } else {
Chris@3 694 for (i = 0; i < n; ++i) {
Chris@3 695 ro[table[i]] = ri[i];
Chris@3 696 io[table[i]] = 0.0;
Chris@3 697 }
Chris@3 698 }
Chris@3 699
Chris@3 700 blockEnd = 1;
Chris@3 701
Chris@3 702 for (blockSize = 2; blockSize <= n; blockSize <<= 1) {
Chris@3 703
Chris@3 704 double delta = angle / (double)blockSize;
Chris@3 705 double sm2 = -sin(-2 * delta);
Chris@3 706 double sm1 = -sin(-delta);
Chris@3 707 double cm2 = cos(-2 * delta);
Chris@3 708 double cm1 = cos(-delta);
Chris@3 709 double w = 2 * cm1;
Chris@3 710 double ar[3], ai[3];
Chris@3 711
Chris@3 712 for (i = 0; i < n; i += blockSize) {
Chris@3 713
Chris@3 714 ar[2] = cm2;
Chris@3 715 ar[1] = cm1;
Chris@3 716
Chris@3 717 ai[2] = sm2;
Chris@3 718 ai[1] = sm1;
Chris@3 719
Chris@3 720 for (j = i, m = 0; m < blockEnd; j++, m++) {
Chris@3 721
Chris@3 722 ar[0] = w * ar[1] - ar[2];
Chris@3 723 ar[2] = ar[1];
Chris@3 724 ar[1] = ar[0];
Chris@3 725
Chris@3 726 ai[0] = w * ai[1] - ai[2];
Chris@3 727 ai[2] = ai[1];
Chris@3 728 ai[1] = ai[0];
Chris@3 729
Chris@3 730 k = j + blockEnd;
Chris@3 731 tr = ar[0] * ro[k] - ai[0] * io[k];
Chris@3 732 ti = ar[0] * io[k] + ai[0] * ro[k];
Chris@3 733
Chris@3 734 ro[k] = ro[j] - tr;
Chris@3 735 io[k] = io[j] - ti;
Chris@3 736
Chris@3 737 ro[j] += tr;
Chris@3 738 io[j] += ti;
Chris@3 739 }
Chris@3 740 }
Chris@3 741
Chris@3 742 blockEnd = blockSize;
Chris@3 743 }
Chris@3 744 }
Chris@3 745
Chris@3 746