vamp-tempogram: TempogramPlugin.cpp annotate

annotate TempogramPlugin.cpp @ 51:c7cc649dc9b6

* I had made further changes to previous revisions accidentally. Now should work.

author	Carl Bussey <c.bussey@se10.qmul.ac.uk>
date	Tue, 30 Sep 2014 16:19:31 +0100
parents	45ba1627d802
children	eff9dc53de62

rev	line source
Chris@43	1 /* -- c-basic-offset: 4 indent-tabs-mode: nil -- vi:set ts=8 sts=4 sw=4: */
c@0	2
Chris@43	3 /*
Chris@43	4 Vamp Tempogram Plugin
Chris@43	5 Carl Bussey, Centre for Digital Music, Queen Mary University of London
Chris@43	6 Copyright 2014 Queen Mary University of London.
Chris@43	7
Chris@43	8 This program is free software; you can redistribute it and/or
Chris@43	9 modify it under the terms of the GNU General Public License as
Chris@43	10 published by the Free Software Foundation; either version 2 of the
Chris@43	11 License, or (at your option) any later version. See the file
Chris@43	12 COPYING included with this distribution for more information.
Chris@43	13 */
c@0	14
c@14	15 #include "TempogramPlugin.h"
c@25	16
c@0	17 using Vamp::FFT;
c@7	18 using Vamp::RealTime;
c@0	19 using namespace std;
c@0	20
c@14	21 TempogramPlugin::TempogramPlugin(float inputSampleRate) :
c@0	22 Plugin(inputSampleRate),
c@18	23 m_inputBlockSize(0), //host parameter
c@18	24 m_inputStepSize(0), //host parameter
c@29	25 m_noveltyCurveMinDB(-74), //parameter
c@29	26 m_noveltyCurveMinV(0), //set in initialise()
c@18	27 m_noveltyCurveCompressionConstant(1000), //parameter
c@18	28 m_tempogramLog2WindowLength(10), //parameter
c@29	29 m_tempogramWindowLength(0), //set in initialise()
c@18	30 m_tempogramLog2FftLength(m_tempogramLog2WindowLength), //parameter
c@29	31 m_tempogramFftLength(0), //set in initialise()
c@18	32 m_tempogramLog2HopSize(6), //parameter
c@29	33 m_tempogramHopSize(0), //set in initialise()
c@18	34 m_tempogramMinBPM(30), //parameter
c@18	35 m_tempogramMaxBPM(480), //parameter
c@18	36 m_tempogramMinBin(0), //set in initialise()
c@18	37 m_tempogramMaxBin(0), //set in initialise()
c@29	38 m_tempogramMinLag(0), //set in initialise()
c@29	39 m_tempogramMaxLag(0), //set in initialise()
c@18	40 m_cyclicTempogramMinBPM(30), //reset in initialise()
c@18	41 m_cyclicTempogramNumberOfOctaves(0), //set in initialise()
c@49	42 m_cyclicTempogramOctaveDivider(30), //parameter
c@50	43 m_cyclicTempogramReferenceBPM(60) //parameter
c@0	44
c@0	45 // Also be sure to set your plugin parameters (presumably stored
c@0	46 // in member variables) to their default values here -- the host
c@0	47 // will not do that for you
c@0	48 {
c@0	49 }
c@0	50
c@14	51 TempogramPlugin::~TempogramPlugin()
c@0	52 {
c@0	53 //delete stuff
c@0	54 }
c@0	55
c@0	56 string
c@14	57 TempogramPlugin::getIdentifier() const
c@0	58 {
c@0	59 return "tempogram";
c@0	60 }
c@0	61
c@0	62 string
c@14	63 TempogramPlugin::getName() const
c@0	64 {
c@0	65 return "Tempogram";
c@0	66 }
c@0	67
c@0	68 string
c@14	69 TempogramPlugin::getDescription() const
c@0	70 {
c@0	71 return "Cyclic Tempogram as described by Peter Grosche and Meinard Muller";
c@0	72 }
c@0	73
c@0	74 string
c@14	75 TempogramPlugin::getMaker() const
c@0	76 {
c@0	77 return "Carl Bussey";
c@0	78 }
c@0	79
c@0	80 int
c@14	81 TempogramPlugin::getPluginVersion() const
c@0	82 {
c@0	83 return 1;
c@0	84 }
c@0	85
c@0	86 string
c@14	87 TempogramPlugin::getCopyright() const
c@0	88 {
Chris@40	89 return "Copyright 2014 Queen Mary University of London. GPL licence.";
c@0	90 }
c@0	91
c@14	92 TempogramPlugin::InputDomain
c@14	93 TempogramPlugin::getInputDomain() const
c@0	94 {
c@0	95 return FrequencyDomain;
c@0	96 }
c@0	97
c@0	98 size_t
c@14	99 TempogramPlugin::getPreferredBlockSize() const
c@0	100 {
c@9	101 return 2048; // 0 means "I can handle any block size"
c@0	102 }
c@0	103
c@0	104 size_t
c@14	105 TempogramPlugin::getPreferredStepSize() const
c@0	106 {
c@9	107 return 1024; // 0 means "anything sensible"; in practice this
c@0	108 // means the same as the block size for TimeDomain
c@0	109 // plugins, or half of it for FrequencyDomain plugins
c@0	110 }
c@0	111
c@0	112 size_t
c@14	113 TempogramPlugin::getMinChannelCount() const
c@0	114 {
c@0	115 return 1;
c@0	116 }
c@0	117
c@0	118 size_t
c@14	119 TempogramPlugin::getMaxChannelCount() const
c@0	120 {
c@0	121 return 1;
c@0	122 }
c@0	123
c@14	124 TempogramPlugin::ParameterList
c@14	125 TempogramPlugin::getParameterDescriptors() const
c@0	126 {
c@0	127 ParameterList list;
c@0	128
c@0	129 // If the plugin has no adjustable parameters, return an empty
c@0	130 // list here (and there's no need to provide implementations of
c@0	131 // getParameter and setParameter in that case either).
c@0	132
c@0	133 // Note that it is your responsibility to make sure the parameters
c@0	134 // start off having their default values (e.g. in the constructor
c@0	135 // above). The host needs to know the default value so it can do
c@0	136 // things like provide a "reset to default" function, but it will
c@0	137 // not explicitly set your parameters to their defaults for you if
c@0	138 // they have not changed in the mean time.
c@0	139
c@14	140 ParameterDescriptor d1;
c@14	141 d1.identifier = "C";
c@15	142 d1.name = "Novelty Curve Spectrogram Compression Constant";
c@14	143 d1.description = "Spectrogram compression constant, C, used when retrieving the novelty curve from the audio.";
c@14	144 d1.unit = "";
c@14	145 d1.minValue = 2;
c@14	146 d1.maxValue = 10000;
c@14	147 d1.defaultValue = 1000;
c@14	148 d1.isQuantized = false;
c@14	149 list.push_back(d1);
c@29	150
c@29	151 ParameterDescriptor d2;
c@29	152 d2.identifier = "minDB";
c@29	153 d2.name = "Novelty Curve Minimum DB";
c@29	154 d2.description = "Spectrogram minimum DB used when removing unwanted peaks in the Spectrogram when retrieving the novelty curve from the audio.";
c@29	155 d2.unit = "";
c@29	156 d2.minValue = -100;
c@29	157 d2.maxValue = -50;
c@29	158 d2.defaultValue = -74;
c@29	159 d2.isQuantized = false;
c@29	160 list.push_back(d2);
c@9	161
c@14	162 ParameterDescriptor d3;
c@29	163 d3.identifier = "log2TN";
c@29	164 d3.name = "Tempogram Window Length";
c@29	165 d3.description = "FFT window length when analysing the novelty curve and extracting the tempogram time-frequency function.";
c@14	166 d3.unit = "";
c@29	167 d3.minValue = 7;
c@14	168 d3.maxValue = 12;
c@29	169 d3.defaultValue = 10;
c@14	170 d3.isQuantized = true;
c@14	171 d3.quantizeStep = 1;
c@14	172 for (int i = d3.minValue; i <= d3.maxValue; i++){
c@14	173 d3.valueNames.push_back(floatToString(pow((float)2,(float)i)));
c@14	174 }
c@14	175 list.push_back(d3);
c@9	176
c@14	177 ParameterDescriptor d4;
c@29	178 d4.identifier = "log2HopSize";
c@29	179 d4.name = "Tempogram Hopsize";
c@29	180 d4.description = "FFT hopsize when analysing the novelty curve and extracting the tempogram time-frequency function.";
c@14	181 d4.unit = "";
c@14	182 d4.minValue = 6;
c@14	183 d4.maxValue = 12;
c@29	184 d4.defaultValue = 6;
c@14	185 d4.isQuantized = true;
c@14	186 d4.quantizeStep = 1;
c@14	187 for (int i = d4.minValue; i <= d4.maxValue; i++){
c@14	188 d4.valueNames.push_back(floatToString(pow((float)2,(float)i)));
c@14	189 }
c@14	190 list.push_back(d4);
c@14	191
c@14	192 ParameterDescriptor d5;
c@29	193 d5.identifier = "log2FftLength";
c@29	194 d5.name = "Tempogram FFT Length";
c@29	195 d5.description = "FFT length when analysing the novelty curve and extracting the tempogram time-frequency function. This parameter determines the amount of zero padding.";
c@14	196 d5.unit = "";
c@29	197 d5.minValue = 6;
c@29	198 d5.maxValue = 12;
Chris@42	199 d5.defaultValue = 10;
c@14	200 d5.isQuantized = true;
c@29	201 d5.quantizeStep = 1;
c@29	202 for (int i = d5.minValue; i <= d5.maxValue; i++){
Chris@41	203 d5.valueNames.push_back(floatToString(pow((float)2,(float)i)));
c@29	204 }
c@14	205 list.push_back(d5);
c@14	206
c@14	207 ParameterDescriptor d6;
c@29	208 d6.identifier = "minBPM";
c@29	209 d6.name = "(Cyclic) Tempogram Minimum BPM";
c@29	210 d6.description = "The minimum BPM of the tempogram output bins.";
c@14	211 d6.unit = "";
c@29	212 d6.minValue = 0;
c@14	213 d6.maxValue = 2000;
c@29	214 d6.defaultValue = 30;
c@14	215 d6.isQuantized = true;
c@14	216 d6.quantizeStep = 5;
c@14	217 list.push_back(d6);
c@18	218
c@18	219 ParameterDescriptor d7;
c@29	220 d7.identifier = "maxBPM";
c@29	221 d7.name = "(Cyclic) Tempogram Maximum BPM";
c@29	222 d7.description = "The maximum BPM of the tempogram output bins.";
c@18	223 d7.unit = "";
c@29	224 d7.minValue = 30;
c@29	225 d7.maxValue = 2000;
c@29	226 d7.defaultValue = 480;
c@18	227 d7.isQuantized = true;
c@29	228 d7.quantizeStep = 5;
c@18	229 list.push_back(d7);
c@29	230
c@29	231 ParameterDescriptor d8;
c@29	232 d8.identifier = "octDiv";
c@29	233 d8.name = "Cyclic Tempogram Octave Divider";
c@29	234 d8.description = "The number bins within each octave.";
c@29	235 d8.unit = "";
c@29	236 d8.minValue = 5;
c@29	237 d8.maxValue = 60;
c@29	238 d8.defaultValue = 30;
c@29	239 d8.isQuantized = true;
c@29	240 d8.quantizeStep = 1;
c@29	241 list.push_back(d8);
c@51	242
c@51	243 ParameterDescriptor d9;
c@51	244 d8.identifier = "refBPM";
c@51	245 d8.name = "Cyclic Tempogram Reference Tempo";
c@51	246 d8.description = "The reference tempo used when calculating the Cyclic Tempogram parameter \'s\'.";
c@51	247 d8.unit = "";
c@51	248 d8.minValue = 5;
c@51	249 d8.maxValue = 60;
c@51	250 d8.defaultValue = 30;
c@51	251 d8.isQuantized = true;
c@51	252 d8.quantizeStep = 1;
c@51	253 list.push_back(d8);
c@0	254
c@0	255 return list;
c@0	256 }
c@0	257
c@0	258 float
c@14	259 TempogramPlugin::getParameter(string identifier) const
c@0	260 {
c@0	261 if (identifier == "C") {
c@18	262 return m_noveltyCurveCompressionConstant; // return the ACTUAL current value of your parameter here!
c@0	263 }
c@29	264 else if (identifier == "minDB"){
c@29	265 return m_noveltyCurveMinDB;
c@29	266 }
c@14	267 else if (identifier == "log2TN"){
c@18	268 return m_tempogramLog2WindowLength;
c@9	269 }
c@14	270 else if (identifier == "log2HopSize"){
c@18	271 return m_tempogramLog2HopSize;
c@14	272 }
c@14	273 else if (identifier == "log2FftLength"){
c@18	274 return m_tempogramLog2FftLength;
c@14	275 }
c@14	276 else if (identifier == "minBPM") {
c@18	277 return m_tempogramMinBPM;
c@9	278 }
c@14	279 else if (identifier == "maxBPM"){
c@18	280 return m_tempogramMaxBPM;
c@18	281 }
c@18	282 else if (identifier == "octDiv"){
c@18	283 return m_cyclicTempogramOctaveDivider;
c@0	284 }
c@51	285 else if (identifier == "refBPM"){
c@51	286 return m_cyclicTempogramReferenceBPM;
c@51	287 }
c@0	288
c@0	289 return 0;
c@0	290 }
c@0	291
c@0	292 void
c@14	293 TempogramPlugin::setParameter(string identifier, float value)
c@0	294 {
c@9	295
c@0	296 if (identifier == "C") {
c@18	297 m_noveltyCurveCompressionConstant = value; // set the actual value of your parameter
c@0	298 }
c@29	299 else if (identifier == "minDB"){
c@29	300 m_noveltyCurveMinDB = value;
c@29	301 }
c@14	302 else if (identifier == "log2TN") {
c@18	303 m_tempogramLog2WindowLength = value;
c@0	304 }
c@14	305 else if (identifier == "log2HopSize"){
c@30	306 m_tempogramLog2HopSize = value;
c@14	307 }
c@18	308 else if (identifier == "log2FftLength"){
c@30	309 m_tempogramLog2FftLength = value;
c@14	310 }
c@14	311 else if (identifier == "minBPM") {
c@18	312 m_tempogramMinBPM = value;
c@9	313 }
c@14	314 else if (identifier == "maxBPM"){
c@18	315 m_tempogramMaxBPM = value;
c@18	316 }
c@18	317 else if (identifier == "octDiv"){
c@18	318 m_cyclicTempogramOctaveDivider = value;
c@9	319 }
c@51	320 else if (identifier == "refBPM"){
c@51	321 m_cyclicTempogramReferenceBPM = value;
c@51	322 }
c@9	323
c@9	324 }
c@9	325
c@14	326 TempogramPlugin::ProgramList
c@14	327 TempogramPlugin::getPrograms() const
c@0	328 {
c@0	329 ProgramList list;
c@0	330
c@0	331 // If you have no programs, return an empty list (or simply don't
c@0	332 // implement this function or getCurrentProgram/selectProgram)
c@0	333
c@0	334 return list;
c@0	335 }
c@0	336
c@0	337 string
c@14	338 TempogramPlugin::getCurrentProgram() const
c@0	339 {
c@0	340 return ""; // no programs
c@0	341 }
c@0	342
c@0	343 void
c@14	344 TempogramPlugin::selectProgram(string name)
c@0	345 {
c@0	346 }
c@0	347
c@14	348 TempogramPlugin::OutputList
c@14	349 TempogramPlugin::getOutputDescriptors() const
c@0	350 {
c@0	351 OutputList list;
c@0	352
c@0	353 // See OutputDescriptor documentation for the possibilities here.
c@0	354 // Every plugin must have at least one output.
c@1	355
c@7	356 float d_sampleRate;
c@18	357 float tempogramInputSampleRate = (float)m_inputSampleRate/m_inputStepSize;
c@25	358 OutputDescriptor d1;
c@25	359 d1.identifier = "cyclicTempogram";
c@25	360 d1.name = "Cyclic Tempogram";
Chris@43	361 d1.description = "Cyclic tempogram calculated by \"octave folding\" the DFT tempogram";
c@25	362 d1.unit = "";
c@25	363 d1.hasFixedBinCount = true;
c@25	364 d1.binCount = m_cyclicTempogramOctaveDivider > 0 && !isnan(m_cyclicTempogramOctaveDivider) ? m_cyclicTempogramOctaveDivider : 0;
c@25	365 d1.hasKnownExtents = false;
c@25	366 d1.isQuantized = false;
c@25	367 d1.sampleType = OutputDescriptor::FixedSampleRate;
c@25	368 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
c@25	369 d1.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0;
c@51	370 vector< vector <unsigned int> > logBins = calculateTempogramNearestNeighbourLogBins();
c@51	371 if (!logBins.empty()){
c@51	372 float scale = pow(2,floor(60/logBins[0][0]));
c@51	373
c@51	374 cerr << m_cyclicTempogramOctaveDivider << endl;
c@51	375 for(int i = 0; i < m_cyclicTempogramNumberOfOctaves; i++){
c@51	376 float s = fmod(binToBPM(logBins[0][i]), m_cyclicTempogramReferenceBPM)*scale;
c@51	377 d1.binNames.push_back(floatToString(s));
c@51	378 cerr << i << endl;
c@51	379 //cerr << m_cyclicTempogramOctaveDivider << " " << s << endl;
c@51	380 }
c@51	381 }
c@25	382 d1.hasDuration = false;
c@25	383 list.push_back(d1);
c@25	384
c@25	385 OutputDescriptor d2;
c@25	386 d2.identifier = "tempogramDFT";
c@25	387 d2.name = "Tempogram via DFT";
Chris@43	388 d2.description = "Tempogram calculated using Discrete Fourier Transform method";
Chris@43	389 d2.unit = ""; // unit of bin contents, not of "bin label", so not bpm
c@25	390 d2.hasFixedBinCount = true;
c@25	391 d2.binCount = m_tempogramMaxBin - m_tempogramMinBin + 1;
c@25	392 d2.hasKnownExtents = false;
c@25	393 d2.isQuantized = false;
c@25	394 d2.sampleType = OutputDescriptor::FixedSampleRate;
c@25	395 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
c@25	396 d2.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0.0;
c@25	397 for(int i = m_tempogramMinBin; i <= (int)m_tempogramMaxBin; i++){
c@25	398 float w = ((float)i/m_tempogramFftLength)*(tempogramInputSampleRate);
c@25	399 d2.binNames.push_back(floatToString(w*60));
c@25	400 }
c@25	401 d2.hasDuration = false;
c@25	402 list.push_back(d2);
c@25	403
c@21	404 OutputDescriptor d3;
c@25	405 d3.identifier = "tempogramACT";
c@25	406 d3.name = "Tempogram via ACT";
Chris@43	407 d3.description = "Tempogram calculated using autocorrelation method";
Chris@43	408 d3.unit = ""; // unit of bin contents, not of "bin label", so not bpm
c@21	409 d3.hasFixedBinCount = true;
c@28	410 d3.binCount = m_tempogramMaxLag - m_tempogramMinLag + 1;
c@21	411 d3.hasKnownExtents = false;
c@21	412 d3.isQuantized = false;
c@21	413 d3.sampleType = OutputDescriptor::FixedSampleRate;
c@21	414 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
c@25	415 d3.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0.0;
c@28	416 for(int lag = m_tempogramMaxLag; lag >= (int)m_tempogramMinLag; lag--){
c@28	417 d3.binNames.push_back(floatToString(60/(m_inputStepSize*(lag/m_inputSampleRate))));
c@25	418 }
c@21	419 d3.hasDuration = false;
c@21	420 list.push_back(d3);
c@21	421
c@25	422 OutputDescriptor d4;
c@25	423 d4.identifier = "nc";
c@25	424 d4.name = "Novelty Curve";
Chris@43	425 d4.description = "Novelty curve underlying the tempogram calculations";
c@25	426 d4.unit = "";
c@25	427 d4.hasFixedBinCount = true;
c@25	428 d4.binCount = 1;
c@25	429 d4.hasKnownExtents = false;
c@25	430 d4.isQuantized = false;
c@25	431 d4.sampleType = OutputDescriptor::FixedSampleRate;
c@9	432 d_sampleRate = tempogramInputSampleRate;
c@25	433 d4.sampleRate = d_sampleRate > 0 && !isnan(d_sampleRate) ? d_sampleRate : 0;
c@25	434 d4.hasDuration = false;
c@25	435 list.push_back(d4);
c@18	436
c@0	437 return list;
c@0	438 }
c@0	439
c@20	440 bool
c@20	441 TempogramPlugin::initialise(size_t channels, size_t stepSize, size_t blockSize)
c@20	442 {
c@20	443 if (channels < getMinChannelCount() \|\|
c@20	444 channels > getMaxChannelCount()) return false;
c@20	445
c@20	446 // Real initialisation work goes here!
c@20	447 m_inputBlockSize = blockSize;
c@20	448 m_inputStepSize = stepSize;
c@20	449
c@24	450 //m_spectrogram = Spectrogram(m_inputBlockSize/2 + 1);
c@21	451 if (!handleParameterValues()) return false;
c@19	452 //cout << m_cyclicTempogramOctaveDivider << endl;
c@4	453
c@0	454 return true;
c@0	455 }
c@0	456
c@0	457 void
c@14	458 TempogramPlugin::reset()
c@0	459 {
c@0	460 // Clear buffers, reset stored values, etc
c@19	461 m_spectrogram.clear();
c@21	462 handleParameterValues();
c@0	463 }
c@0	464
c@14	465 TempogramPlugin::FeatureSet
c@14	466 TempogramPlugin::process(const float const inputBuffers, Vamp::RealTime timestamp)
c@0	467 {
c@23	468 int n = m_inputBlockSize/2 + 1;
c@0	469 const float *in = inputBuffers[0];
c@3	470
c@9	471 //calculate magnitude of FrequencyDomain input
c@22	472 vector<float> fftCoefficients;
c@23	473 for (int i = 0; i < n; i++){
c@0	474 float magnitude = sqrt(in[2i] in[2i] + in[2i + 1] * in[2*i + 1]);
c@29	475 magnitude = magnitude > m_noveltyCurveMinV ? magnitude : m_noveltyCurveMinV;
c@22	476 fftCoefficients.push_back(magnitude);
c@0	477 }
c@22	478 m_spectrogram.push_back(fftCoefficients);
c@24	479 //m_spectrogram.push_back(fftCoefficients);
c@21	480
c@23	481 return FeatureSet();
c@0	482 }
c@0	483
c@14	484 TempogramPlugin::FeatureSet
c@14	485 TempogramPlugin::getRemainingFeatures()
c@11	486 {
c@0	487
c@18	488 float * hannWindow = new float[m_tempogramWindowLength];
c@20	489 for (int i = 0; i < (int)m_tempogramWindowLength; i++){
c@14	490 hannWindow[i] = 0.0;
c@4	491 }
c@11	492
c@1	493 FeatureSet featureSet;
c@0	494
c@19	495 //initialise novelty curve processor
c@23	496 int numberOfBlocks = m_spectrogram.size();
Chris@48	497
c@22	498 NoveltyCurveProcessor nc(m_inputSampleRate, m_inputBlockSize, m_noveltyCurveCompressionConstant);
c@21	499 vector<float> noveltyCurve = nc.spectrogramToNoveltyCurve(m_spectrogram); //calculate novelty curvefrom magnitude data
c@4	500
c@9	501 //push novelty curve data to featureset 1 and set timestamps
c@23	502 for (int i = 0; i < numberOfBlocks; i++){
c@19	503 Feature noveltyCurveFeature;
c@19	504 noveltyCurveFeature.values.push_back(noveltyCurve[i]);
c@19	505 noveltyCurveFeature.hasTimestamp = false;
c@25	506 featureSet[3].push_back(noveltyCurveFeature);
c@21	507 assert(!isnan(noveltyCurveFeature.values.back()));
c@4	508 }
c@4	509
c@9	510 //window function for spectrogram
c@18	511 WindowFunction::hanning(hannWindow, m_tempogramWindowLength);
c@9	512
c@9	513 //initialise spectrogram processor
c@18	514 SpectrogramProcessor spectrogramProcessor(m_tempogramWindowLength, m_tempogramFftLength, m_tempogramHopSize);
c@9	515 //compute spectrogram from novelty curve data (i.e., tempogram)
c@25	516 Tempogram tempogramDFT = spectrogramProcessor.process(&noveltyCurve[0], numberOfBlocks, hannWindow);
c@18	517 delete []hannWindow;
c@18	518 hannWindow = 0;
c@0	519
c@25	520 int tempogramLength = tempogramDFT.size();
c@7	521
c@9	522 //push tempogram data to featureset 0 and set timestamps.
c@7	523 for (int block = 0; block < tempogramLength; block++){
c@25	524 Feature tempogramDFTFeature;
c@28	525
c@28	526 assert(tempogramDFT[block].size() == (m_tempogramFftLength/2 + 1));
c@28	527 for(int k = m_tempogramMinBin; k <= (int)m_tempogramMaxBin; k++){
c@28	528 tempogramDFTFeature.values.push_back(tempogramDFT[block][k]);
c@28	529 }
c@28	530 tempogramDFTFeature.hasTimestamp = false;
c@28	531 featureSet[1].push_back(tempogramDFTFeature);
c@28	532 }
c@28	533
c@28	534 AutocorrelationProcessor autocorrelationProcessor(m_tempogramWindowLength, m_tempogramHopSize);
c@28	535 Tempogram tempogramACT = autocorrelationProcessor.process(&noveltyCurve[0], numberOfBlocks);
c@28	536
c@28	537 for (int block = 0; block < tempogramLength; block++){
c@25	538 Feature tempogramACTFeature;
Chris@44	539
c@28	540 for(int k = m_tempogramMaxLag; k >= (int)m_tempogramMinLag; k--){
c@25	541 tempogramACTFeature.values.push_back(tempogramACT[block][k]);
c@0	542 }
c@25	543 tempogramACTFeature.hasTimestamp = false;
c@25	544 featureSet[2].push_back(tempogramACTFeature);
c@0	545 }
c@0	546
c@18	547 //Calculate cyclic tempogram
c@22	548 vector< vector<unsigned int> > logBins = calculateTempogramNearestNeighbourLogBins();
c@18	549
c@22	550 //assert((int)logBins.size() == m_cyclicTempogramOctaveDivider*m_cyclicTempogramNumberOfOctaves);
c@18	551 for (int block = 0; block < tempogramLength; block++){
c@19	552 Feature cyclicTempogramFeature;
c@18	553
c@23	554 for (int i = 0; i < m_cyclicTempogramOctaveDivider; i++){
c@18	555 float sum = 0;
c@21	556
c@23	557 for (int j = 0; j < m_cyclicTempogramNumberOfOctaves; j++){
Chris@48	558 sum += tempogramDFT[block][logBins[j][i]];
c@18	559 }
c@19	560 cyclicTempogramFeature.values.push_back(sum/m_cyclicTempogramNumberOfOctaves);
c@21	561 assert(!isnan(cyclicTempogramFeature.values.back()));
c@18	562 }
c@18	563
c@19	564 cyclicTempogramFeature.hasTimestamp = false;
c@21	565 featureSet[0].push_back(cyclicTempogramFeature);
c@18	566 }
c@0	567
c@0	568 return featureSet;
c@0	569 }
c@22	570
c@22	571 vector< vector<unsigned int> > TempogramPlugin::calculateTempogramNearestNeighbourLogBins() const
c@22	572 {
c@22	573 vector< vector<unsigned int> > logBins;
c@22	574
c@22	575 for (int octave = 0; octave < (int)m_cyclicTempogramNumberOfOctaves; octave++){
c@22	576 vector<unsigned int> octaveBins;
Chris@47	577
c@22	578 for (int bin = 0; bin < (int)m_cyclicTempogramOctaveDivider; bin++){
c@22	579 float bpm = m_cyclicTempogramMinBPM*pow(2.0f, octave+(float)bin/m_cyclicTempogramOctaveDivider);
c@22	580 octaveBins.push_back(bpmToBin(bpm));
c@22	581 }
c@22	582 logBins.push_back(octaveBins);
c@22	583 }
c@22	584
c@22	585 return logBins;
c@22	586 }
c@22	587
c@22	588 unsigned int TempogramPlugin::bpmToBin(const float &bpm) const
c@22	589 {
c@22	590 float w = (float)bpm/60;
c@22	591 float sampleRate = m_inputSampleRate/m_inputStepSize;
c@22	592 int bin = floor((float)m_tempogramFftLength*w/sampleRate + 0.5);
c@22	593
c@22	594 if(bin < 0) bin = 0;
Chris@46	595 else if(bin > m_tempogramFftLength/2.0f) bin = m_tempogramFftLength/2.0f;
c@22	596
c@22	597 return bin;
c@22	598 }
c@22	599
c@22	600 float TempogramPlugin::binToBPM(const int &bin) const
c@22	601 {
c@22	602 float sampleRate = m_inputSampleRate/m_inputStepSize;
c@22	603
c@22	604 return (binsampleRate/m_tempogramFftLength)60;
c@22	605 }
c@22	606
c@22	607 bool TempogramPlugin::handleParameterValues(){
c@22	608
Chris@42	609 if (m_tempogramLog2HopSize <= 0) {
Chris@42	610 cerr << "Tempogram log2 hop size " << m_tempogramLog2HopSize
Chris@42	611 << " <= 0, failing initialise" << endl;
Chris@42	612 return false;
Chris@42	613 }
Chris@42	614 if (m_tempogramLog2FftLength <= 0) {
Chris@42	615 cerr << "Tempogram log2 fft length " << m_tempogramLog2FftLength
Chris@42	616 << " <= 0, failing initialise" << endl;
Chris@42	617 return false;
Chris@42	618 }
c@22	619
Chris@42	620 if (m_tempogramMinBPM < 1) {
Chris@42	621 m_tempogramMinBPM = 1;
Chris@42	622 }
c@22	623 if (m_tempogramMinBPM >= m_tempogramMaxBPM){
c@22	624 m_tempogramMinBPM = 30;
c@22	625 m_tempogramMaxBPM = 480;
c@22	626 }
c@22	627
c@29	628 m_noveltyCurveMinV = pow(10,(float)m_noveltyCurveMinDB/20);
c@29	629
c@29	630 m_tempogramWindowLength = pow(2,m_tempogramLog2WindowLength);
c@29	631 m_tempogramHopSize = pow(2,m_tempogramLog2HopSize);
c@29	632 m_tempogramFftLength = pow(2,m_tempogramLog2FftLength);
c@29	633
c@30	634 if (m_tempogramFftLength < m_tempogramWindowLength){
c@30	635 m_tempogramFftLength = m_tempogramWindowLength;
c@30	636 }
c@30	637
c@22	638 float tempogramInputSampleRate = (float)m_inputSampleRate/m_inputStepSize;
c@28	639 m_tempogramMinBin = (max((int)floor(((m_tempogramMinBPM/60)/tempogramInputSampleRate)*m_tempogramFftLength), 0));
c@28	640 m_tempogramMaxBin = (min((int)ceil(((m_tempogramMaxBPM/60)/tempogramInputSampleRate)*m_tempogramFftLength), (int)(m_tempogramFftLength/2)));
Chris@32	641
Chris@32	642 if (m_tempogramMaxBin < m_tempogramMinBin) {
Chris@32	643 cerr << "At audio sample rate " << m_inputSampleRate
Chris@32	644 << ", tempogram sample rate " << tempogramInputSampleRate
Chris@32	645 << " with bpm range " << m_tempogramMinBPM << " -> "
Chris@32	646 << m_tempogramMaxBPM << ", min bin = " << m_tempogramMinBin
Chris@32	647 << " > max bin " << m_tempogramMaxBin
Chris@32	648 << ": can't proceed, failing initialise" << endl;
Chris@32	649 return false;
Chris@32	650 }
c@28	651
c@28	652 m_tempogramMinLag = max((int)ceil((60/(m_inputStepSize * m_tempogramMaxBPM))*m_inputSampleRate), 0);
Chris@45	653 m_tempogramMaxLag = min((int)floor((60/(m_inputStepSize * m_tempogramMinBPM))*m_inputSampleRate), (int)m_tempogramWindowLength-1);
Chris@32	654
Chris@32	655 if (m_tempogramMaxLag < m_tempogramMinLag) {
Chris@32	656 cerr << "At audio sample rate " << m_inputSampleRate
Chris@32	657 << ", tempogram sample rate " << tempogramInputSampleRate
Chris@42	658 << ", window length " << m_tempogramWindowLength
Chris@32	659 << " with bpm range " << m_tempogramMinBPM << " -> "
Chris@42	660 << m_tempogramMaxBPM << ", min lag = " << m_tempogramMinLag
Chris@42	661 << " > max lag " << m_tempogramMaxLag
Chris@32	662 << ": can't proceed, failing initialise" << endl;
Chris@32	663 return false;
Chris@32	664 }
c@22	665
Chris@47	666 m_cyclicTempogramMinBPM = max(binToBPM(m_tempogramMinBin), m_tempogramMinBPM);
Chris@47	667 float cyclicTempogramMaxBPM = min(binToBPM(m_tempogramMaxBin), m_tempogramMaxBPM);
Chris@47	668
c@22	669 m_cyclicTempogramNumberOfOctaves = floor(log2(cyclicTempogramMaxBPM/m_cyclicTempogramMinBPM));
Chris@42	670
Chris@42	671 if (m_cyclicTempogramNumberOfOctaves < 1) {
Chris@42	672 cerr << "At audio sample rate " << m_inputSampleRate
Chris@42	673 << ", tempogram sample rate " << tempogramInputSampleRate
Chris@42	674 << " with bpm range " << m_tempogramMinBPM << " -> "
Chris@42	675 << m_tempogramMaxBPM << ", cyclic tempogram min bpm = "
Chris@42	676 << m_cyclicTempogramMinBPM << " and max bpm = "
Chris@42	677 << cyclicTempogramMaxBPM << " giving number of octaves = "
Chris@42	678 << m_cyclicTempogramNumberOfOctaves
Chris@42	679 << ": can't proceed, failing initialise" << endl;
Chris@42	680 return false;
Chris@42	681 }
c@22	682
c@22	683 return true;
c@22	684 }
c@22	685
c@22	686 string TempogramPlugin::floatToString(float value) const
c@22	687 {
c@22	688 ostringstream ss;
c@22	689
c@22	690 if(!(ss << value)) throw runtime_error("TempogramPlugin::floatToString(): invalid conversion from float to string");
c@22	691 return ss.str();
c@22	692 }

Mercurial > hg > vamp-tempogram

annotate TempogramPlugin.cpp @ 51:c7cc649dc9b6