Chris@43
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
c@0
|
2
|
Chris@43
|
3 /*
|
Chris@43
|
4 Vamp Tempogram Plugin
|
Chris@43
|
5 Carl Bussey, Centre for Digital Music, Queen Mary University of London
|
Chris@43
|
6 Copyright 2014 Queen Mary University of London.
|
Chris@43
|
7
|
Chris@43
|
8 This program is free software; you can redistribute it and/or
|
Chris@43
|
9 modify it under the terms of the GNU General Public License as
|
Chris@43
|
10 published by the Free Software Foundation; either version 2 of the
|
Chris@43
|
11 License, or (at your option) any later version. See the file
|
Chris@43
|
12 COPYING included with this distribution for more information.
|
Chris@43
|
13 */
|
c@0
|
14
|
c@14
|
15 #include "TempogramPlugin.h"
|
c@25
|
16
|
c@0
|
17 using Vamp::FFT;
|
c@7
|
18 using Vamp::RealTime;
|
c@0
|
19 using namespace std;
|
c@0
|
20
|
c@14
|
21 TempogramPlugin::TempogramPlugin(float inputSampleRate) :
|
c@0
|
22 Plugin(inputSampleRate),
|
c@18
|
23 m_inputBlockSize(0), //host parameter
|
c@18
|
24 m_inputStepSize(0), //host parameter
|
c@29
|
25 m_noveltyCurveMinDB(-74), //parameter
|
c@29
|
26 m_noveltyCurveMinV(0), //set in initialise()
|
c@18
|
27 m_noveltyCurveCompressionConstant(1000), //parameter
|
c@18
|
28 m_tempogramLog2WindowLength(10), //parameter
|
c@29
|
29 m_tempogramWindowLength(0), //set in initialise()
|
c@18
|
30 m_tempogramLog2FftLength(m_tempogramLog2WindowLength), //parameter
|
c@29
|
31 m_tempogramFftLength(0), //set in initialise()
|
c@18
|
32 m_tempogramLog2HopSize(6), //parameter
|
c@29
|
33 m_tempogramHopSize(0), //set in initialise()
|
c@18
|
34 m_tempogramMinBPM(30), //parameter
|
c@18
|
35 m_tempogramMaxBPM(480), //parameter
|
c@18
|
36 m_tempogramMinBin(0), //set in initialise()
|
c@18
|
37 m_tempogramMaxBin(0), //set in initialise()
|
c@29
|
38 m_tempogramMinLag(0), //set in initialise()
|
c@29
|
39 m_tempogramMaxLag(0), //set in initialise()
|
c@18
|
40 m_cyclicTempogramMinBPM(30), //reset in initialise()
|
c@18
|
41 m_cyclicTempogramNumberOfOctaves(0), //set in initialise()
|
c@49
|
42 m_cyclicTempogramOctaveDivider(30), //parameter
|
c@50
|
43 m_cyclicTempogramReferenceBPM(60) //parameter
|
c@0
|
44
|
c@0
|
45 // Also be sure to set your plugin parameters (presumably stored
|
c@0
|
46 // in member variables) to their default values here -- the host
|
c@0
|
47 // will not do that for you
|
c@0
|
48 {
|
c@0
|
49 }
|
c@0
|
50
|
c@14
|
51 TempogramPlugin::~TempogramPlugin()
|
c@0
|
52 {
|
c@0
|
53 //delete stuff
|
c@0
|
54 }
|
c@0
|
55
|
c@0
|
56 string
|
c@14
|
57 TempogramPlugin::getIdentifier() const
|
c@0
|
58 {
|
c@0
|
59 return "tempogram";
|
c@0
|
60 }
|
c@0
|
61
|
c@0
|
62 string
|
c@14
|
63 TempogramPlugin::getName() const
|
c@0
|
64 {
|
c@0
|
65 return "Tempogram";
|
c@0
|
66 }
|
c@0
|
67
|
c@0
|
68 string
|
c@14
|
69 TempogramPlugin::getDescription() const
|
c@0
|
70 {
|
c@0
|
71 return "Cyclic Tempogram as described by Peter Grosche and Meinard Muller";
|
c@0
|
72 }
|
c@0
|
73
|
c@0
|
74 string
|
c@14
|
75 TempogramPlugin::getMaker() const
|
c@0
|
76 {
|
c@0
|
77 return "Carl Bussey";
|
c@0
|
78 }
|
c@0
|
79
|
c@0
|
80 int
|
c@14
|
81 TempogramPlugin::getPluginVersion() const
|
c@0
|
82 {
|
c@0
|
83 return 1;
|
c@0
|
84 }
|
c@0
|
85
|
c@0
|
86 string
|
c@14
|
87 TempogramPlugin::getCopyright() const
|
c@0
|
88 {
|
Chris@40
|
89 return "Copyright 2014 Queen Mary University of London. GPL licence.";
|
c@0
|
90 }
|
c@0
|
91
|
c@14
|
92 TempogramPlugin::InputDomain
|
c@14
|
93 TempogramPlugin::getInputDomain() const
|
c@0
|
94 {
|
c@0
|
95 return FrequencyDomain;
|
c@0
|
96 }
|
c@0
|
97
|
c@0
|
98 size_t
|
c@14
|
99 TempogramPlugin::getPreferredBlockSize() const
|
c@0
|
100 {
|
c@9
|
101 return 2048; // 0 means "I can handle any block size"
|
c@0
|
102 }
|
c@0
|
103
|
c@0
|
104 size_t
|
c@14
|
105 TempogramPlugin::getPreferredStepSize() const
|
c@0
|
106 {
|
c@9
|
107 return 1024; // 0 means "anything sensible"; in practice this
|
c@0
|
108 // means the same as the block size for TimeDomain
|
c@0
|
109 // plugins, or half of it for FrequencyDomain plugins
|
c@0
|
110 }
|
c@0
|
111
|
c@0
|
112 size_t
|
c@14
|
113 TempogramPlugin::getMinChannelCount() const
|
c@0
|
114 {
|
c@0
|
115 return 1;
|
c@0
|
116 }
|
c@0
|
117
|
c@0
|
118 size_t
|
c@14
|
119 TempogramPlugin::getMaxChannelCount() const
|
c@0
|
120 {
|
c@0
|
121 return 1;
|
c@0
|
122 }
|
c@0
|
123
|
c@14
|
124 TempogramPlugin::ParameterList
|
c@14
|
125 TempogramPlugin::getParameterDescriptors() const
|
c@0
|
126 {
|
c@0
|
127 ParameterList list;
|
c@0
|
128
|
c@0
|
129 // If the plugin has no adjustable parameters, return an empty
|
c@0
|
130 // list here (and there's no need to provide implementations of
|
c@0
|
131 // getParameter and setParameter in that case either).
|
c@0
|
132
|
c@0
|
133 // Note that it is your responsibility to make sure the parameters
|
c@0
|
134 // start off having their default values (e.g. in the constructor
|
c@0
|
135 // above). The host needs to know the default value so it can do
|
c@0
|
136 // things like provide a "reset to default" function, but it will
|
c@0
|
137 // not explicitly set your parameters to their defaults for you if
|
c@0
|
138 // they have not changed in the mean time.
|
c@0
|
139
|
c@14
|
140 ParameterDescriptor d1;
|
c@14
|
141 d1.identifier = "C";
|
c@15
|
142 d1.name = "Novelty Curve Spectrogram Compression Constant";
|
c@14
|
143 d1.description = "Spectrogram compression constant, C, used when retrieving the novelty curve from the audio.";
|
c@14
|
144 d1.unit = "";
|
c@14
|
145 d1.minValue = 2;
|
c@14
|
146 d1.maxValue = 10000;
|
c@14
|
147 d1.defaultValue = 1000;
|
c@14
|
148 d1.isQuantized = false;
|
c@14
|
149 list.push_back(d1);
|
c@29
|
150
|
c@29
|
151 ParameterDescriptor d2;
|
c@29
|
152 d2.identifier = "minDB";
|
c@29
|
153 d2.name = "Novelty Curve Minimum DB";
|
c@29
|
154 d2.description = "Spectrogram minimum DB used when removing unwanted peaks in the Spectrogram when retrieving the novelty curve from the audio.";
|
c@29
|
155 d2.unit = "";
|
c@29
|
156 d2.minValue = -100;
|
c@29
|
157 d2.maxValue = -50;
|
c@29
|
158 d2.defaultValue = -74;
|
c@29
|
159 d2.isQuantized = false;
|
c@29
|
160 list.push_back(d2);
|
c@9
|
161
|
c@14
|
162 ParameterDescriptor d3;
|
c@29
|
163 d3.identifier = "log2TN";
|
c@29
|
164 d3.name = "Tempogram Window Length";
|
c@29
|
165 d3.description = "FFT window length when analysing the novelty curve and extracting the tempogram time-frequency function.";
|
c@14
|
166 d3.unit = "";
|
c@29
|
167 d3.minValue = 7;
|
c@14
|
168 d3.maxValue = 12;
|
c@29
|
169 d3.defaultValue = 10;
|
c@14
|
170 d3.isQuantized = true;
|
c@14
|
171 d3.quantizeStep = 1;
|
c@14
|
172 for (int i = d3.minValue; i <= d3.maxValue; i++){
|
c@14
|
173 d3.valueNames.push_back(floatToString(pow((float)2,(float)i)));
|
c@14
|
174 }
|
c@14
|
175 list.push_back(d3);
|
c@9
|
176
|
c@14
|
177 ParameterDescriptor d4;
|
c@29
|
178 d4.identifier = "log2HopSize";
|
c@29
|
179 d4.name = "Tempogram Hopsize";
|
c@29
|
180 d4.description = "FFT hopsize when analysing the novelty curve and extracting the tempogram time-frequency function.";
|
c@14
|
181 d4.unit = "";
|
c@14
|
182 d4.minValue = 6;
|
c@14
|
183 d4.maxValue = 12;
|
c@29
|
184 d4.defaultValue = 6;
|
c@14
|
185 d4.isQuantized = true;
|
c@14
|
186 d4.quantizeStep = 1;
|
c@14
|
187 for (int i = d4.minValue; i <= d4.maxValue; i++){
|
c@14
|
188 d4.valueNames.push_back(floatToString(pow((float)2,(float)i)));
|
c@14
|
189 }
|
c@14
|
190 list.push_back(d4);
|
c@14
|
191
|
c@14
|
192 ParameterDescriptor d5;
|
c@29
|
193 d5.identifier = "log2FftLength";
|
c@29
|
194 d5.name = "Tempogram FFT Length";
|
c@29
|
195 d5.description = "FFT length when analysing the novelty curve and extracting the tempogram time-frequency function. This parameter determines the amount of zero padding.";
|
c@14
|
196 d5.unit = "";
|
c@29
|
197 d5.minValue = 6;
|
c@29
|
198 d5.maxValue = 12;
|
Chris@42
|
199 d5.defaultValue = 10;
|
c@14
|
200 d5.isQuantized = true;
|
c@29
|
201 d5.quantizeStep = 1;
|
c@29
|
202 for (int i = d5.minValue; i <= d5.maxValue; i++){
|
Chris@41
|
203 d5.valueNames.push_back(floatToString(pow((float)2,(float)i)));
|
c@29
|
204 }
|
c@14
|
205 list.push_back(d5);
|
c@14
|
206
|
c@14
|
207 ParameterDescriptor d6;
|
c@29
|
208 d6.identifier = "minBPM";
|
c@29
|
209 d6.name = "(Cyclic) Tempogram Minimum BPM";
|
c@29
|
210 d6.description = "The minimum BPM of the tempogram output bins.";
|
c@14
|
211 d6.unit = "";
|
c@29
|
212 d6.minValue = 0;
|
c@14
|
213 d6.maxValue = 2000;
|
c@29
|
214 d6.defaultValue = 30;
|
c@14
|
215 d6.isQuantized = true;
|
c@14
|
216 d6.quantizeStep = 5;
|
c@14
|
217 list.push_back(d6);
|
c@18
|
218
|
c@18
|
219 ParameterDescriptor d7;
|
c@29
|
220 d7.identifier = "maxBPM";
|
c@29
|
221 d7.name = "(Cyclic) Tempogram Maximum BPM";
|
c@29
|
222 d7.description = "The maximum BPM of the tempogram output bins.";
|
c@18
|
223 d7.unit = "";
|
c@29
|
224 d7.minValue = 30;
|
c@29
|
225 d7.maxValue = 2000;
|
c@29
|
226 d7.defaultValue = 480;
|
c@18
|
227 d7.isQuantized = true;
|
c@29
|
228 d7.quantizeStep = 5;
|
c@18
|
229 list.push_back(d7);
|
c@29
|
230
|
c@29
|
231 ParameterDescriptor d8;
|
c@29
|
232 d8.identifier = "octDiv";
|
c@29
|
233 d8.name = "Cyclic Tempogram Octave Divider";
|
c@29
|
234 d8.description = "The number bins within each octave.";
|
c@29
|
235 d8.unit = "";
|
c@29
|
236 d8.minValue = 5;
|
c@29
|
237 d8.maxValue = 60;
|
c@29
|
238 d8.defaultValue = 30;
|
c@29
|
239 d8.isQuantized = true;
|
c@29
|
240 d8.quantizeStep = 1;
|
c@29
|
241 list.push_back(d8);
|
c@51
|
242
|
c@51
|
243 ParameterDescriptor d9;
|
c@51
|
244 d8.identifier = "refBPM";
|
c@51
|
245 d8.name = "Cyclic Tempogram Reference Tempo";
|
c@51
|
246 d8.description = "The reference tempo used when calculating the Cyclic Tempogram parameter \'s\'.";
|
c@51
|
247 d8.unit = "";
|
c@51
|
248 d8.minValue = 5;
|
c@51
|
249 d8.maxValue = 60;
|
c@51
|
250 d8.defaultValue = 30;
|
c@51
|
251 d8.isQuantized = true;
|
c@51
|
252 d8.quantizeStep = 1;
|
c@51
|
253 list.push_back(d8);
|
c@0
|
254
|
c@0
|
255 return list;
|
c@0
|
256 }
|
c@0
|
257
|
c@0
|
258 float
|
c@14
|
259 TempogramPlugin::getParameter(string identifier) const
|
c@0
|
260 {
|
c@0
|
261 if (identifier == "C") {
|
c@18
|
262 return m_noveltyCurveCompressionConstant; // return the ACTUAL current value of your parameter here!
|
c@0
|
263 }
|
c@29
|
264 else if (identifier == "minDB"){
|
c@29
|
265 return m_noveltyCurveMinDB;
|
c@29
|
266 }
|
c@14
|
267 else if (identifier == "log2TN"){
|
c@18
|
268 return m_tempogramLog2WindowLength;
|
c@9
|
269 }
|
c@14
|
270 else if (identifier == "log2HopSize"){
|
c@18
|
271 return m_tempogramLog2HopSize;
|
c@14
|
272 }
|
c@14
|
273 else if (identifier == "log2FftLength"){
|
c@18
|
274 return m_tempogramLog2FftLength;
|
c@14
|
275 }
|
c@14
|
276 else if (identifier == "minBPM") {
|
c@18
|
277 return m_tempogramMinBPM;
|
c@9
|
278 }
|
c@14
|
279 else if (identifier == "maxBPM"){
|
c@18
|
280 return m_tempogramMaxBPM;
|
c@18
|
281 }
|
c@18
|
282 else if (identifier == "octDiv"){
|
c@18
|
283 return m_cyclicTempogramOctaveDivider;
|
c@0
|
284 }
|
c@51
|
285 else if (identifier == "refBPM"){
|
c@51
|
286 return m_cyclicTempogramReferenceBPM;
|
c@51
|
287 }
|
c@0
|
288
|
c@0
|
289 return 0;
|
c@0
|
290 }
|
c@0
|
291
|
c@0
|
292 void
|
c@14
|
293 TempogramPlugin::setParameter(string identifier, float value)
|
c@0
|
294 {
|
c@9
|
295
|
c@0
|
296 if (identifier == "C") {
|
c@18
|
297 m_noveltyCurveCompressionConstant = value; // set the actual value of your parameter
|
c@0
|
298 }
|
c@29
|
299 else if (identifier == "minDB"){
|
c@29
|
300 m_noveltyCurveMinDB = value;
|
c@29
|
301 }
|
c@14
|
302 else if (identifier == "log2TN") {
|
c@18
|
303 m_tempogramLog2WindowLength = value;
|
c@0
|
304 }
|
c@14
|
305 else if (identifier == "log2HopSize"){
|
c@30
|
306 m_tempogramLog2HopSize = value;
|
c@14
|
307 }
|
c@18
|
308 else if (identifier == "log2FftLength"){
|
c@30
|
309 m_tempogramLog2FftLength = value;
|
c@14
|
310 }
|
c@14
|
311 else if (identifier == "minBPM") {
|
c@18
|
312 m_tempogramMinBPM = value;
|
c@9
|
313 }
|
c@14
|
314 else if (identifier == "maxBPM"){
|
c@18
|
315 m_tempogramMaxBPM = value;
|
c@18
|
316 }
|
c@18
|
317 else if (identifier == "octDiv"){
|
c@18
|
318 m_cyclicTempogramOctaveDivider = value;
|
c@9
|
319 }
|
c@51
|
320 else if (identifier == "refBPM"){
|
c@51
|
321 m_cyclicTempogramReferenceBPM = value;
|
c@51
|
322 }
|
c@9
|
323
|
c@9
|
324 }
|
c@9
|
325
|
c@14
|
326 TempogramPlugin::ProgramList
|
c@14
|
327 TempogramPlugin::getPrograms() const
|
c@0
|
328 {
|
c@0
|
329 ProgramList list;
|
c@0
|
330
|
c@0
|
331 // If you have no programs, return an empty list (or simply don't
|
c@0
|
332 // implement this function or getCurrentProgram/selectProgram)
|
c@0
|
333
|
c@0
|
334 return list;
|
c@0
|
335 }
|
c@0
|
336
|
c@0
|
337 string
|
c@14
|
338 TempogramPlugin::getCurrentProgram() const
|
c@0
|
339 {
|
c@0
|
340 return ""; // no programs
|
c@0
|
341 }
|
c@0
|
342
|
c@0
|
343 void
|
c@14
|
344 TempogramPlugin::selectProgram(string name)
|
c@0
|
345 {
|
c@0
|
346 }
|
c@0
|
347
|
c@14
|
348 TempogramPlugin::OutputList
|
c@14
|
349 TempogramPlugin::getOutputDescriptors() const
|
c@0
|
350 {
|
c@0
|
351 OutputList list;
|
c@0
|
352
|
c@0
|
353 // See OutputDescriptor documentation for the possibilities here.
|
c@0
|
354 // Every plugin must have at least one output.
|
c@1
|
355
|
c@7
|
356 float d_sampleRate;
|
c@18
|
357 float tempogramInputSampleRate = (float)m_inputSampleRate/m_inputStepSize;
|
c@25
|
358 OutputDescriptor d1;
|
c@25
|
359 d1.identifier = "cyclicTempogram";
|
c@25
|
360 d1.name = "Cyclic Tempogram";
|
Chris@43
|
361 d1.description = "Cyclic tempogram calculated by \"octave folding\" the DFT tempogram";
|
c@25
|
362 d1.unit = "";
|
c@25
|
363 d1.hasFixedBinCount = true;
|
c@25
|
364 d1.binCount = m_cyclicTempogramOctaveDivider > 0 && !isnan(m_cyclicTempogramOctaveDivider) ? m_cyclicTempogramOctaveDivider : 0;
|
c@25
|
365 d1.hasKnownExtents = false;
|
c@25
|
366 d1.isQuantized = false;
|
c@25
|
367 d1.sampleType = OutputDescriptor::FixedSampleRate;
|
c@25
|
368 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
|
c@25
|
369 d1.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0;
|
c@51
|
370 vector< vector <unsigned int> > logBins = calculateTempogramNearestNeighbourLogBins();
|
c@51
|
371 if (!logBins.empty()){
|
c@51
|
372 float scale = pow(2,floor(60/logBins[0][0]));
|
c@51
|
373
|
c@51
|
374 cerr << m_cyclicTempogramOctaveDivider << endl;
|
c@51
|
375 for(int i = 0; i < m_cyclicTempogramNumberOfOctaves; i++){
|
c@51
|
376 float s = fmod(binToBPM(logBins[0][i]), m_cyclicTempogramReferenceBPM)*scale;
|
c@51
|
377 d1.binNames.push_back(floatToString(s));
|
c@51
|
378 cerr << i << endl;
|
c@51
|
379 //cerr << m_cyclicTempogramOctaveDivider << " " << s << endl;
|
c@51
|
380 }
|
c@51
|
381 }
|
c@25
|
382 d1.hasDuration = false;
|
c@25
|
383 list.push_back(d1);
|
c@25
|
384
|
c@25
|
385 OutputDescriptor d2;
|
c@25
|
386 d2.identifier = "tempogramDFT";
|
c@25
|
387 d2.name = "Tempogram via DFT";
|
Chris@43
|
388 d2.description = "Tempogram calculated using Discrete Fourier Transform method";
|
Chris@43
|
389 d2.unit = ""; // unit of bin contents, not of "bin label", so not bpm
|
c@25
|
390 d2.hasFixedBinCount = true;
|
c@25
|
391 d2.binCount = m_tempogramMaxBin - m_tempogramMinBin + 1;
|
c@25
|
392 d2.hasKnownExtents = false;
|
c@25
|
393 d2.isQuantized = false;
|
c@25
|
394 d2.sampleType = OutputDescriptor::FixedSampleRate;
|
c@25
|
395 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
|
c@25
|
396 d2.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0.0;
|
c@25
|
397 for(int i = m_tempogramMinBin; i <= (int)m_tempogramMaxBin; i++){
|
c@25
|
398 float w = ((float)i/m_tempogramFftLength)*(tempogramInputSampleRate);
|
c@25
|
399 d2.binNames.push_back(floatToString(w*60));
|
c@25
|
400 }
|
c@25
|
401 d2.hasDuration = false;
|
c@25
|
402 list.push_back(d2);
|
c@25
|
403
|
c@21
|
404 OutputDescriptor d3;
|
c@25
|
405 d3.identifier = "tempogramACT";
|
c@25
|
406 d3.name = "Tempogram via ACT";
|
Chris@43
|
407 d3.description = "Tempogram calculated using autocorrelation method";
|
Chris@43
|
408 d3.unit = ""; // unit of bin contents, not of "bin label", so not bpm
|
c@21
|
409 d3.hasFixedBinCount = true;
|
c@28
|
410 d3.binCount = m_tempogramMaxLag - m_tempogramMinLag + 1;
|
c@21
|
411 d3.hasKnownExtents = false;
|
c@21
|
412 d3.isQuantized = false;
|
c@21
|
413 d3.sampleType = OutputDescriptor::FixedSampleRate;
|
c@21
|
414 d_sampleRate = tempogramInputSampleRate/m_tempogramHopSize;
|
c@25
|
415 d3.sampleRate = d_sampleRate > 0.0 && !isnan(d_sampleRate) ? d_sampleRate : 0.0;
|
c@28
|
416 for(int lag = m_tempogramMaxLag; lag >= (int)m_tempogramMinLag; lag--){
|
c@28
|
417 d3.binNames.push_back(floatToString(60/(m_inputStepSize*(lag/m_inputSampleRate))));
|
c@25
|
418 }
|
c@21
|
419 d3.hasDuration = false;
|
c@21
|
420 list.push_back(d3);
|
c@21
|
421
|
c@25
|
422 OutputDescriptor d4;
|
c@25
|
423 d4.identifier = "nc";
|
c@25
|
424 d4.name = "Novelty Curve";
|
Chris@43
|
425 d4.description = "Novelty curve underlying the tempogram calculations";
|
c@25
|
426 d4.unit = "";
|
c@25
|
427 d4.hasFixedBinCount = true;
|
c@25
|
428 d4.binCount = 1;
|
c@25
|
429 d4.hasKnownExtents = false;
|
c@25
|
430 d4.isQuantized = false;
|
c@25
|
431 d4.sampleType = OutputDescriptor::FixedSampleRate;
|
c@9
|
432 d_sampleRate = tempogramInputSampleRate;
|
c@25
|
433 d4.sampleRate = d_sampleRate > 0 && !isnan(d_sampleRate) ? d_sampleRate : 0;
|
c@25
|
434 d4.hasDuration = false;
|
c@25
|
435 list.push_back(d4);
|
c@18
|
436
|
c@0
|
437 return list;
|
c@0
|
438 }
|
c@0
|
439
|
c@20
|
440 bool
|
c@20
|
441 TempogramPlugin::initialise(size_t channels, size_t stepSize, size_t blockSize)
|
c@20
|
442 {
|
c@20
|
443 if (channels < getMinChannelCount() ||
|
c@20
|
444 channels > getMaxChannelCount()) return false;
|
c@20
|
445
|
c@20
|
446 // Real initialisation work goes here!
|
c@20
|
447 m_inputBlockSize = blockSize;
|
c@20
|
448 m_inputStepSize = stepSize;
|
c@20
|
449
|
c@24
|
450 //m_spectrogram = Spectrogram(m_inputBlockSize/2 + 1);
|
c@21
|
451 if (!handleParameterValues()) return false;
|
c@19
|
452 //cout << m_cyclicTempogramOctaveDivider << endl;
|
c@4
|
453
|
c@0
|
454 return true;
|
c@0
|
455 }
|
c@0
|
456
|
c@0
|
457 void
|
c@14
|
458 TempogramPlugin::reset()
|
c@0
|
459 {
|
c@0
|
460 // Clear buffers, reset stored values, etc
|
c@19
|
461 m_spectrogram.clear();
|
c@21
|
462 handleParameterValues();
|
c@0
|
463 }
|
c@0
|
464
|
c@14
|
465 TempogramPlugin::FeatureSet
|
c@14
|
466 TempogramPlugin::process(const float *const *inputBuffers, Vamp::RealTime timestamp)
|
c@0
|
467 {
|
c@23
|
468 int n = m_inputBlockSize/2 + 1;
|
c@0
|
469 const float *in = inputBuffers[0];
|
c@3
|
470
|
c@9
|
471 //calculate magnitude of FrequencyDomain input
|
c@22
|
472 vector<float> fftCoefficients;
|
c@23
|
473 for (int i = 0; i < n; i++){
|
c@0
|
474 float magnitude = sqrt(in[2*i] * in[2*i] + in[2*i + 1] * in[2*i + 1]);
|
c@29
|
475 magnitude = magnitude > m_noveltyCurveMinV ? magnitude : m_noveltyCurveMinV;
|
c@22
|
476 fftCoefficients.push_back(magnitude);
|
c@0
|
477 }
|
c@22
|
478 m_spectrogram.push_back(fftCoefficients);
|
c@24
|
479 //m_spectrogram.push_back(fftCoefficients);
|
c@21
|
480
|
c@23
|
481 return FeatureSet();
|
c@0
|
482 }
|
c@0
|
483
|
c@14
|
484 TempogramPlugin::FeatureSet
|
c@14
|
485 TempogramPlugin::getRemainingFeatures()
|
c@11
|
486 {
|
c@0
|
487
|
c@18
|
488 float * hannWindow = new float[m_tempogramWindowLength];
|
c@20
|
489 for (int i = 0; i < (int)m_tempogramWindowLength; i++){
|
c@14
|
490 hannWindow[i] = 0.0;
|
c@4
|
491 }
|
c@11
|
492
|
c@1
|
493 FeatureSet featureSet;
|
c@0
|
494
|
c@19
|
495 //initialise novelty curve processor
|
c@23
|
496 int numberOfBlocks = m_spectrogram.size();
|
Chris@48
|
497
|
c@22
|
498 NoveltyCurveProcessor nc(m_inputSampleRate, m_inputBlockSize, m_noveltyCurveCompressionConstant);
|
c@21
|
499 vector<float> noveltyCurve = nc.spectrogramToNoveltyCurve(m_spectrogram); //calculate novelty curvefrom magnitude data
|
c@4
|
500
|
c@9
|
501 //push novelty curve data to featureset 1 and set timestamps
|
c@23
|
502 for (int i = 0; i < numberOfBlocks; i++){
|
c@19
|
503 Feature noveltyCurveFeature;
|
c@19
|
504 noveltyCurveFeature.values.push_back(noveltyCurve[i]);
|
c@19
|
505 noveltyCurveFeature.hasTimestamp = false;
|
c@25
|
506 featureSet[3].push_back(noveltyCurveFeature);
|
c@21
|
507 assert(!isnan(noveltyCurveFeature.values.back()));
|
c@4
|
508 }
|
c@4
|
509
|
c@9
|
510 //window function for spectrogram
|
c@18
|
511 WindowFunction::hanning(hannWindow, m_tempogramWindowLength);
|
c@9
|
512
|
c@9
|
513 //initialise spectrogram processor
|
c@18
|
514 SpectrogramProcessor spectrogramProcessor(m_tempogramWindowLength, m_tempogramFftLength, m_tempogramHopSize);
|
c@9
|
515 //compute spectrogram from novelty curve data (i.e., tempogram)
|
c@25
|
516 Tempogram tempogramDFT = spectrogramProcessor.process(&noveltyCurve[0], numberOfBlocks, hannWindow);
|
c@18
|
517 delete []hannWindow;
|
c@18
|
518 hannWindow = 0;
|
c@0
|
519
|
c@25
|
520 int tempogramLength = tempogramDFT.size();
|
c@7
|
521
|
c@9
|
522 //push tempogram data to featureset 0 and set timestamps.
|
c@7
|
523 for (int block = 0; block < tempogramLength; block++){
|
c@25
|
524 Feature tempogramDFTFeature;
|
c@28
|
525
|
c@28
|
526 assert(tempogramDFT[block].size() == (m_tempogramFftLength/2 + 1));
|
c@28
|
527 for(int k = m_tempogramMinBin; k <= (int)m_tempogramMaxBin; k++){
|
c@28
|
528 tempogramDFTFeature.values.push_back(tempogramDFT[block][k]);
|
c@28
|
529 }
|
c@28
|
530 tempogramDFTFeature.hasTimestamp = false;
|
c@28
|
531 featureSet[1].push_back(tempogramDFTFeature);
|
c@28
|
532 }
|
c@28
|
533
|
c@28
|
534 AutocorrelationProcessor autocorrelationProcessor(m_tempogramWindowLength, m_tempogramHopSize);
|
c@28
|
535 Tempogram tempogramACT = autocorrelationProcessor.process(&noveltyCurve[0], numberOfBlocks);
|
c@28
|
536
|
c@28
|
537 for (int block = 0; block < tempogramLength; block++){
|
c@25
|
538 Feature tempogramACTFeature;
|
Chris@44
|
539
|
c@28
|
540 for(int k = m_tempogramMaxLag; k >= (int)m_tempogramMinLag; k--){
|
c@25
|
541 tempogramACTFeature.values.push_back(tempogramACT[block][k]);
|
c@0
|
542 }
|
c@25
|
543 tempogramACTFeature.hasTimestamp = false;
|
c@25
|
544 featureSet[2].push_back(tempogramACTFeature);
|
c@0
|
545 }
|
c@0
|
546
|
c@18
|
547 //Calculate cyclic tempogram
|
c@22
|
548 vector< vector<unsigned int> > logBins = calculateTempogramNearestNeighbourLogBins();
|
c@18
|
549
|
c@22
|
550 //assert((int)logBins.size() == m_cyclicTempogramOctaveDivider*m_cyclicTempogramNumberOfOctaves);
|
c@18
|
551 for (int block = 0; block < tempogramLength; block++){
|
c@19
|
552 Feature cyclicTempogramFeature;
|
c@18
|
553
|
c@23
|
554 for (int i = 0; i < m_cyclicTempogramOctaveDivider; i++){
|
c@18
|
555 float sum = 0;
|
c@21
|
556
|
c@23
|
557 for (int j = 0; j < m_cyclicTempogramNumberOfOctaves; j++){
|
Chris@48
|
558 sum += tempogramDFT[block][logBins[j][i]];
|
c@18
|
559 }
|
c@19
|
560 cyclicTempogramFeature.values.push_back(sum/m_cyclicTempogramNumberOfOctaves);
|
c@21
|
561 assert(!isnan(cyclicTempogramFeature.values.back()));
|
c@18
|
562 }
|
c@18
|
563
|
c@19
|
564 cyclicTempogramFeature.hasTimestamp = false;
|
c@21
|
565 featureSet[0].push_back(cyclicTempogramFeature);
|
c@18
|
566 }
|
c@0
|
567
|
c@0
|
568 return featureSet;
|
c@0
|
569 }
|
c@22
|
570
|
c@22
|
571 vector< vector<unsigned int> > TempogramPlugin::calculateTempogramNearestNeighbourLogBins() const
|
c@22
|
572 {
|
c@22
|
573 vector< vector<unsigned int> > logBins;
|
c@22
|
574
|
c@22
|
575 for (int octave = 0; octave < (int)m_cyclicTempogramNumberOfOctaves; octave++){
|
c@22
|
576 vector<unsigned int> octaveBins;
|
Chris@47
|
577
|
c@22
|
578 for (int bin = 0; bin < (int)m_cyclicTempogramOctaveDivider; bin++){
|
c@22
|
579 float bpm = m_cyclicTempogramMinBPM*pow(2.0f, octave+(float)bin/m_cyclicTempogramOctaveDivider);
|
c@22
|
580 octaveBins.push_back(bpmToBin(bpm));
|
c@22
|
581 }
|
c@22
|
582 logBins.push_back(octaveBins);
|
c@22
|
583 }
|
c@22
|
584
|
c@22
|
585 return logBins;
|
c@22
|
586 }
|
c@22
|
587
|
c@22
|
588 unsigned int TempogramPlugin::bpmToBin(const float &bpm) const
|
c@22
|
589 {
|
c@22
|
590 float w = (float)bpm/60;
|
c@22
|
591 float sampleRate = m_inputSampleRate/m_inputStepSize;
|
c@22
|
592 int bin = floor((float)m_tempogramFftLength*w/sampleRate + 0.5);
|
c@22
|
593
|
c@22
|
594 if(bin < 0) bin = 0;
|
Chris@46
|
595 else if(bin > m_tempogramFftLength/2.0f) bin = m_tempogramFftLength/2.0f;
|
c@22
|
596
|
c@22
|
597 return bin;
|
c@22
|
598 }
|
c@22
|
599
|
c@22
|
600 float TempogramPlugin::binToBPM(const int &bin) const
|
c@22
|
601 {
|
c@22
|
602 float sampleRate = m_inputSampleRate/m_inputStepSize;
|
c@22
|
603
|
c@22
|
604 return (bin*sampleRate/m_tempogramFftLength)*60;
|
c@22
|
605 }
|
c@22
|
606
|
c@22
|
607 bool TempogramPlugin::handleParameterValues(){
|
c@22
|
608
|
Chris@42
|
609 if (m_tempogramLog2HopSize <= 0) {
|
Chris@42
|
610 cerr << "Tempogram log2 hop size " << m_tempogramLog2HopSize
|
Chris@42
|
611 << " <= 0, failing initialise" << endl;
|
Chris@42
|
612 return false;
|
Chris@42
|
613 }
|
Chris@42
|
614 if (m_tempogramLog2FftLength <= 0) {
|
Chris@42
|
615 cerr << "Tempogram log2 fft length " << m_tempogramLog2FftLength
|
Chris@42
|
616 << " <= 0, failing initialise" << endl;
|
Chris@42
|
617 return false;
|
Chris@42
|
618 }
|
c@22
|
619
|
Chris@42
|
620 if (m_tempogramMinBPM < 1) {
|
Chris@42
|
621 m_tempogramMinBPM = 1;
|
Chris@42
|
622 }
|
c@22
|
623 if (m_tempogramMinBPM >= m_tempogramMaxBPM){
|
c@22
|
624 m_tempogramMinBPM = 30;
|
c@22
|
625 m_tempogramMaxBPM = 480;
|
c@22
|
626 }
|
c@22
|
627
|
c@29
|
628 m_noveltyCurveMinV = pow(10,(float)m_noveltyCurveMinDB/20);
|
c@29
|
629
|
c@29
|
630 m_tempogramWindowLength = pow(2,m_tempogramLog2WindowLength);
|
c@29
|
631 m_tempogramHopSize = pow(2,m_tempogramLog2HopSize);
|
c@29
|
632 m_tempogramFftLength = pow(2,m_tempogramLog2FftLength);
|
c@29
|
633
|
c@30
|
634 if (m_tempogramFftLength < m_tempogramWindowLength){
|
c@30
|
635 m_tempogramFftLength = m_tempogramWindowLength;
|
c@30
|
636 }
|
c@30
|
637
|
c@22
|
638 float tempogramInputSampleRate = (float)m_inputSampleRate/m_inputStepSize;
|
c@28
|
639 m_tempogramMinBin = (max((int)floor(((m_tempogramMinBPM/60)/tempogramInputSampleRate)*m_tempogramFftLength), 0));
|
c@28
|
640 m_tempogramMaxBin = (min((int)ceil(((m_tempogramMaxBPM/60)/tempogramInputSampleRate)*m_tempogramFftLength), (int)(m_tempogramFftLength/2)));
|
Chris@32
|
641
|
Chris@32
|
642 if (m_tempogramMaxBin < m_tempogramMinBin) {
|
Chris@32
|
643 cerr << "At audio sample rate " << m_inputSampleRate
|
Chris@32
|
644 << ", tempogram sample rate " << tempogramInputSampleRate
|
Chris@32
|
645 << " with bpm range " << m_tempogramMinBPM << " -> "
|
Chris@32
|
646 << m_tempogramMaxBPM << ", min bin = " << m_tempogramMinBin
|
Chris@32
|
647 << " > max bin " << m_tempogramMaxBin
|
Chris@32
|
648 << ": can't proceed, failing initialise" << endl;
|
Chris@32
|
649 return false;
|
Chris@32
|
650 }
|
c@28
|
651
|
c@28
|
652 m_tempogramMinLag = max((int)ceil((60/(m_inputStepSize * m_tempogramMaxBPM))*m_inputSampleRate), 0);
|
Chris@45
|
653 m_tempogramMaxLag = min((int)floor((60/(m_inputStepSize * m_tempogramMinBPM))*m_inputSampleRate), (int)m_tempogramWindowLength-1);
|
Chris@32
|
654
|
Chris@32
|
655 if (m_tempogramMaxLag < m_tempogramMinLag) {
|
Chris@32
|
656 cerr << "At audio sample rate " << m_inputSampleRate
|
Chris@32
|
657 << ", tempogram sample rate " << tempogramInputSampleRate
|
Chris@42
|
658 << ", window length " << m_tempogramWindowLength
|
Chris@32
|
659 << " with bpm range " << m_tempogramMinBPM << " -> "
|
Chris@42
|
660 << m_tempogramMaxBPM << ", min lag = " << m_tempogramMinLag
|
Chris@42
|
661 << " > max lag " << m_tempogramMaxLag
|
Chris@32
|
662 << ": can't proceed, failing initialise" << endl;
|
Chris@32
|
663 return false;
|
Chris@32
|
664 }
|
c@22
|
665
|
Chris@47
|
666 m_cyclicTempogramMinBPM = max(binToBPM(m_tempogramMinBin), m_tempogramMinBPM);
|
Chris@47
|
667 float cyclicTempogramMaxBPM = min(binToBPM(m_tempogramMaxBin), m_tempogramMaxBPM);
|
Chris@47
|
668
|
c@22
|
669 m_cyclicTempogramNumberOfOctaves = floor(log2(cyclicTempogramMaxBPM/m_cyclicTempogramMinBPM));
|
Chris@42
|
670
|
Chris@42
|
671 if (m_cyclicTempogramNumberOfOctaves < 1) {
|
Chris@42
|
672 cerr << "At audio sample rate " << m_inputSampleRate
|
Chris@42
|
673 << ", tempogram sample rate " << tempogramInputSampleRate
|
Chris@42
|
674 << " with bpm range " << m_tempogramMinBPM << " -> "
|
Chris@42
|
675 << m_tempogramMaxBPM << ", cyclic tempogram min bpm = "
|
Chris@42
|
676 << m_cyclicTempogramMinBPM << " and max bpm = "
|
Chris@42
|
677 << cyclicTempogramMaxBPM << " giving number of octaves = "
|
Chris@42
|
678 << m_cyclicTempogramNumberOfOctaves
|
Chris@42
|
679 << ": can't proceed, failing initialise" << endl;
|
Chris@42
|
680 return false;
|
Chris@42
|
681 }
|
c@22
|
682
|
c@22
|
683 return true;
|
c@22
|
684 }
|
c@22
|
685
|
c@22
|
686 string TempogramPlugin::floatToString(float value) const
|
c@22
|
687 {
|
c@22
|
688 ostringstream ss;
|
c@22
|
689
|
c@22
|
690 if(!(ss << value)) throw runtime_error("TempogramPlugin::floatToString(): invalid conversion from float to string");
|
c@22
|
691 return ss.str();
|
c@22
|
692 }
|