annotate plugins/BarBeatTrack.cpp @ 93:385bec9df059

* minor tidy
author Chris Cannam <c.cannam@qmul.ac.uk>
date Fri, 27 Feb 2009 13:07:07 +0000
parents 52c6817a414e
children e51152b7ee06
rev   line source
c@89 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
c@89 2
c@89 3 /*
c@89 4 QM Vamp Plugin Set
c@89 5
c@89 6 Centre for Digital Music, Queen Mary, University of London.
c@89 7 All rights reserved.
c@89 8 */
c@89 9
c@89 10 #include "BarBeatTrack.h"
c@89 11
c@89 12 #include <dsp/onsets/DetectionFunction.h>
c@89 13 #include <dsp/onsets/PeakPicking.h>
c@89 14 #include <dsp/tempotracking/TempoTrackV2.h>
c@89 15 #include <dsp/tempotracking/DownBeat.h>
c@89 16 #include <maths/MathUtilities.h>
c@89 17
c@89 18 using std::string;
c@89 19 using std::vector;
c@89 20 using std::cerr;
c@89 21 using std::endl;
c@89 22
c@89 23 float BarBeatTracker::m_stepSecs = 0.01161; // 512 samples at 44100
c@89 24
c@89 25 class BarBeatTrackerData
c@89 26 {
c@89 27 public:
c@89 28 BarBeatTrackerData(float rate, const DFConfig &config) : dfConfig(config) {
c@89 29 df = new DetectionFunction(config);
c@89 30 // decimation factor aims at resampling to c. 3KHz; must be power of 2
c@89 31 int factor = MathUtilities::nextPowerOfTwo(rate / 3000);
c@89 32 std::cerr << "BarBeatTrackerData: factor = " << factor << std::endl;
c@89 33 downBeat = new DownBeat(rate, factor, config.stepSize);
c@89 34 }
c@89 35 ~BarBeatTrackerData() {
c@89 36 delete df;
c@89 37 delete downBeat;
c@89 38 }
c@89 39 void reset() {
c@89 40 delete df;
c@89 41 df = new DetectionFunction(dfConfig);
c@89 42 dfOutput.clear();
c@89 43 downBeat->resetAudioBuffer();
c@89 44 origin = Vamp::RealTime::zeroTime;
c@89 45 }
c@89 46
c@89 47 DFConfig dfConfig;
c@89 48 DetectionFunction *df;
c@89 49 DownBeat *downBeat;
c@89 50 vector<double> dfOutput;
c@89 51 Vamp::RealTime origin;
c@89 52 };
c@89 53
c@89 54
c@89 55 BarBeatTracker::BarBeatTracker(float inputSampleRate) :
c@89 56 Vamp::Plugin(inputSampleRate),
c@89 57 m_d(0),
c@89 58 m_bpb(4)
c@89 59 {
c@89 60 }
c@89 61
c@89 62 BarBeatTracker::~BarBeatTracker()
c@89 63 {
c@89 64 delete m_d;
c@89 65 }
c@89 66
c@89 67 string
c@89 68 BarBeatTracker::getIdentifier() const
c@89 69 {
c@89 70 return "qm-barbeattracker";
c@89 71 }
c@89 72
c@89 73 string
c@89 74 BarBeatTracker::getName() const
c@89 75 {
c@89 76 return "Bar and Beat Tracker";
c@89 77 }
c@89 78
c@89 79 string
c@89 80 BarBeatTracker::getDescription() const
c@89 81 {
c@89 82 return "Estimate bar and beat locations";
c@89 83 }
c@89 84
c@89 85 string
c@89 86 BarBeatTracker::getMaker() const
c@89 87 {
c@89 88 return "Queen Mary, University of London";
c@89 89 }
c@89 90
c@89 91 int
c@89 92 BarBeatTracker::getPluginVersion() const
c@89 93 {
c@89 94 return 1;
c@89 95 }
c@89 96
c@89 97 string
c@89 98 BarBeatTracker::getCopyright() const
c@89 99 {
c@89 100 return "Plugin by Matthew Davies, Christian Landone and Chris Cannam. Copyright (c) 2006-2009 QMUL - All Rights Reserved";
c@89 101 }
c@89 102
c@89 103 BarBeatTracker::ParameterList
c@89 104 BarBeatTracker::getParameterDescriptors() const
c@89 105 {
c@89 106 ParameterList list;
c@89 107
c@89 108 ParameterDescriptor desc;
c@89 109
c@89 110 desc.identifier = "bpb";
c@89 111 desc.name = "Beats per Bar";
c@89 112 desc.description = "The number of beats in each bar";
c@89 113 desc.minValue = 2;
c@89 114 desc.maxValue = 16;
c@89 115 desc.defaultValue = 4;
c@89 116 desc.isQuantized = true;
c@89 117 desc.quantizeStep = 1;
c@89 118 list.push_back(desc);
c@89 119
c@89 120 return list;
c@89 121 }
c@89 122
c@89 123 float
c@89 124 BarBeatTracker::getParameter(std::string name) const
c@89 125 {
c@89 126 if (name == "bpb") return m_bpb;
c@89 127 return 0.0;
c@89 128 }
c@89 129
c@89 130 void
c@89 131 BarBeatTracker::setParameter(std::string name, float value)
c@89 132 {
c@89 133 if (name == "bpb") m_bpb = lrintf(value);
c@89 134 }
c@89 135
c@89 136 bool
c@89 137 BarBeatTracker::initialise(size_t channels, size_t stepSize, size_t blockSize)
c@89 138 {
c@89 139 if (m_d) {
c@89 140 delete m_d;
c@89 141 m_d = 0;
c@89 142 }
c@89 143
c@89 144 if (channels < getMinChannelCount() ||
c@89 145 channels > getMaxChannelCount()) {
c@89 146 std::cerr << "BarBeatTracker::initialise: Unsupported channel count: "
c@89 147 << channels << std::endl;
c@89 148 return false;
c@89 149 }
c@89 150
c@89 151 if (stepSize != getPreferredStepSize()) {
c@89 152 std::cerr << "ERROR: BarBeatTracker::initialise: Unsupported step size for this sample rate: "
c@89 153 << stepSize << " (wanted " << (getPreferredStepSize()) << ")" << std::endl;
c@89 154 return false;
c@89 155 }
c@89 156
c@89 157 if (blockSize != getPreferredBlockSize()) {
c@89 158 std::cerr << "WARNING: BarBeatTracker::initialise: Sub-optimal block size for this sample rate: "
c@89 159 << blockSize << " (wanted " << getPreferredBlockSize() << ")" << std::endl;
c@89 160 // return false;
c@89 161 }
c@89 162
c@89 163 DFConfig dfConfig;
c@89 164 dfConfig.DFType = DF_COMPLEXSD;
c@89 165 dfConfig.stepSize = stepSize;
c@89 166 dfConfig.frameLength = blockSize;
c@89 167 dfConfig.dbRise = 3;
c@89 168 dfConfig.adaptiveWhitening = false;
c@89 169 dfConfig.whiteningRelaxCoeff = -1;
c@89 170 dfConfig.whiteningFloor = -1;
c@89 171
c@89 172 m_d = new BarBeatTrackerData(m_inputSampleRate, dfConfig);
c@89 173 m_d->downBeat->setBeatsPerBar(m_bpb);
c@89 174 return true;
c@89 175 }
c@89 176
c@89 177 void
c@89 178 BarBeatTracker::reset()
c@89 179 {
c@89 180 if (m_d) m_d->reset();
c@89 181 }
c@89 182
c@89 183 size_t
c@89 184 BarBeatTracker::getPreferredStepSize() const
c@89 185 {
c@89 186 size_t step = size_t(m_inputSampleRate * m_stepSecs + 0.0001);
c@89 187 // std::cerr << "BarBeatTracker::getPreferredStepSize: input sample rate is " << m_inputSampleRate << ", step size is " << step << std::endl;
c@89 188 return step;
c@89 189 }
c@89 190
c@89 191 size_t
c@89 192 BarBeatTracker::getPreferredBlockSize() const
c@89 193 {
c@89 194 size_t theoretical = getPreferredStepSize() * 2;
c@89 195
c@89 196 // I think this is not necessarily going to be a power of two, and
c@89 197 // the host might have a problem with that, but I'm not sure we
c@89 198 // can do much about it here
c@89 199 return theoretical;
c@89 200 }
c@89 201
c@89 202 BarBeatTracker::OutputList
c@89 203 BarBeatTracker::getOutputDescriptors() const
c@89 204 {
c@89 205 OutputList list;
c@89 206
c@89 207 OutputDescriptor beat;
c@89 208 beat.identifier = "beats";
c@89 209 beat.name = "Beats";
c@89 210 beat.description = "Beat locations labelled with metrical position";
c@89 211 beat.unit = "";
c@89 212 beat.hasFixedBinCount = true;
c@89 213 beat.binCount = 0;
c@89 214 beat.sampleType = OutputDescriptor::VariableSampleRate;
c@89 215 beat.sampleRate = 1.0 / m_stepSecs;
c@89 216
c@89 217 OutputDescriptor bars;
c@89 218 bars.identifier = "bars";
c@89 219 bars.name = "Bars";
c@89 220 bars.description = "Bar locations";
c@89 221 bars.unit = "";
c@89 222 bars.hasFixedBinCount = true;
c@89 223 bars.binCount = 0;
c@89 224 bars.sampleType = OutputDescriptor::VariableSampleRate;
c@89 225 bars.sampleRate = 1.0 / m_stepSecs;
c@89 226
c@89 227 OutputDescriptor beatcounts;
c@89 228 beatcounts.identifier = "beatcounts";
c@89 229 beatcounts.name = "Beat Count";
c@89 230 beatcounts.description = "Beat counter function";
c@89 231 beatcounts.unit = "";
c@89 232 beatcounts.hasFixedBinCount = true;
c@89 233 beatcounts.binCount = 1;
c@89 234 beatcounts.sampleType = OutputDescriptor::VariableSampleRate;
c@89 235 beatcounts.sampleRate = 1.0 / m_stepSecs;
c@89 236
c@90 237 OutputDescriptor beatsd;
c@90 238 beatsd.identifier = "beatsd";
c@90 239 beatsd.name = "Beat Spectral Difference";
c@90 240 beatsd.description = "Beat spectral difference function used for bar-line detection";
c@90 241 beatsd.unit = "";
c@90 242 beatsd.hasFixedBinCount = true;
c@90 243 beatsd.binCount = 1;
c@90 244 beatsd.sampleType = OutputDescriptor::VariableSampleRate;
c@90 245 beatsd.sampleRate = 1.0 / m_stepSecs;
c@90 246
c@89 247 list.push_back(beat);
c@89 248 list.push_back(bars);
c@89 249 list.push_back(beatcounts);
c@90 250 list.push_back(beatsd);
c@89 251
c@89 252 return list;
c@89 253 }
c@89 254
c@89 255 BarBeatTracker::FeatureSet
c@89 256 BarBeatTracker::process(const float *const *inputBuffers,
c@89 257 Vamp::RealTime timestamp)
c@89 258 {
c@89 259 if (!m_d) {
c@89 260 cerr << "ERROR: BarBeatTracker::process: "
c@89 261 << "BarBeatTracker has not been initialised"
c@89 262 << endl;
c@89 263 return FeatureSet();
c@89 264 }
c@89 265
c@89 266 // We use time domain input, because DownBeat requires it -- so we
c@89 267 // use the time-domain version of DetectionFunction::process which
c@89 268 // does its own FFT. It requires doubles as input, so we need to
c@89 269 // make a temporary copy
c@89 270
c@89 271 // We only support a single input channel
c@89 272
c@89 273 const int fl = m_d->dfConfig.frameLength;
c@89 274 double dfinput[fl];
c@89 275 for (int i = 0; i < fl; ++i) dfinput[i] = inputBuffers[0][i];
c@89 276
c@89 277 double output = m_d->df->process(dfinput);
c@89 278
c@89 279 if (m_d->dfOutput.empty()) m_d->origin = timestamp;
c@89 280
c@93 281 // std::cerr << "df[" << m_d->dfOutput.size() << "] is " << output << std::endl;
c@89 282 m_d->dfOutput.push_back(output);
c@89 283
c@89 284 // Downsample and store the incoming audio block.
c@89 285 // We have an overlap on the incoming audio stream (step size is
c@89 286 // half block size) -- this function is configured to take only a
c@89 287 // step size's worth, so effectively ignoring the overlap. Note
c@89 288 // however that this means we omit the last blocksize - stepsize
c@89 289 // samples completely for the purposes of barline detection
c@89 290 // (hopefully not a problem)
c@89 291 m_d->downBeat->pushAudioBlock(inputBuffers[0]);
c@89 292
c@89 293 return FeatureSet();
c@89 294 }
c@89 295
c@89 296 BarBeatTracker::FeatureSet
c@89 297 BarBeatTracker::getRemainingFeatures()
c@89 298 {
c@89 299 if (!m_d) {
c@89 300 cerr << "ERROR: BarBeatTracker::getRemainingFeatures: "
c@89 301 << "BarBeatTracker has not been initialised"
c@89 302 << endl;
c@89 303 return FeatureSet();
c@89 304 }
c@89 305
c@89 306 return barBeatTrack();
c@89 307 }
c@89 308
c@89 309 BarBeatTracker::FeatureSet
c@89 310 BarBeatTracker::barBeatTrack()
c@89 311 {
c@89 312 vector<double> df;
c@89 313 vector<double> beatPeriod;
c@89 314 vector<double> tempi;
c@89 315
c@89 316 for (size_t i = 2; i < m_d->dfOutput.size(); ++i) { // discard first two elts
c@89 317 df.push_back(m_d->dfOutput[i]);
c@89 318 beatPeriod.push_back(0.0);
c@89 319 }
c@89 320 if (df.empty()) return FeatureSet();
c@89 321
c@89 322 TempoTrackV2 tt(m_inputSampleRate, m_d->dfConfig.stepSize);
c@89 323 tt.calculateBeatPeriod(df, beatPeriod, tempi);
c@89 324
c@89 325 vector<double> beats;
c@89 326 tt.calculateBeats(df, beatPeriod, beats);
c@89 327
c@89 328 vector<int> downbeats;
c@89 329 size_t downLength = 0;
c@89 330 const float *downsampled = m_d->downBeat->getBufferedAudio(downLength);
c@89 331 m_d->downBeat->findDownBeats(downsampled, downLength, beats, downbeats);
c@89 332
c@90 333 vector<double> beatsd;
c@90 334 m_d->downBeat->getBeatSD(beatsd);
c@90 335
c@89 336 // std::cerr << "BarBeatTracker: found downbeats at: ";
c@89 337 // for (int i = 0; i < downbeats.size(); ++i) std::cerr << downbeats[i] << " " << std::endl;
c@89 338
c@89 339 FeatureSet returnFeatures;
c@89 340
c@89 341 char label[20];
c@89 342
c@89 343 int dbi = 0;
c@89 344 int beat = 0;
c@89 345 int bar = 0;
c@89 346
c@89 347 for (size_t i = 0; i < beats.size(); ++i) {
c@89 348
c@89 349 size_t frame = beats[i] * m_d->dfConfig.stepSize;
c@89 350
c@89 351 if (dbi < downbeats.size() && i == downbeats[dbi]) {
c@89 352 beat = 0;
c@89 353 ++bar;
c@89 354 ++dbi;
c@89 355 } else {
c@89 356 ++beat;
c@89 357 }
c@89 358
c@89 359 // outputs are:
c@89 360 //
c@89 361 // 0 -> beats
c@89 362 // 1 -> bars
c@89 363 // 2 -> beat counter function
c@89 364
c@89 365 Feature feature;
c@89 366 feature.hasTimestamp = true;
c@89 367 feature.timestamp = m_d->origin + Vamp::RealTime::frame2RealTime
c@89 368 (frame, lrintf(m_inputSampleRate));
c@89 369
c@89 370 sprintf(label, "%d", beat + 1);
c@89 371 feature.label = label;
c@89 372 returnFeatures[0].push_back(feature); // labelled beats
c@89 373
c@89 374 feature.values.push_back(beat + 1);
c@89 375 returnFeatures[2].push_back(feature); // beat function
c@89 376
c@90 377 if (i > 0 && i <= beatsd.size()) {
c@90 378 feature.values.clear();
c@90 379 feature.values.push_back(beatsd[i-1]);
c@90 380 feature.label = "";
c@90 381 returnFeatures[3].push_back(feature); // beat spectral difference
c@90 382 }
c@90 383
c@89 384 if (beat == 0) {
c@89 385 feature.values.clear();
c@89 386 sprintf(label, "%d", bar);
c@89 387 feature.label = label;
c@89 388 returnFeatures[1].push_back(feature); // bars
c@89 389 }
c@89 390 }
c@89 391
c@89 392 return returnFeatures;
c@89 393 }
c@89 394