cannam@1
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
cannam@1
|
2
|
cannam@1
|
3 /*
|
cannam@1
|
4 Vamp
|
cannam@1
|
5
|
cannam@1
|
6 An API for audio analysis and feature extraction plugins.
|
cannam@1
|
7
|
cannam@1
|
8 Centre for Digital Music, Queen Mary, University of London.
|
cannam@1
|
9 Copyright 2006 Chris Cannam.
|
cannam@16
|
10 FFT code from Don Cross's public domain FFT implementation.
|
cannam@1
|
11
|
cannam@1
|
12 Permission is hereby granted, free of charge, to any person
|
cannam@1
|
13 obtaining a copy of this software and associated documentation
|
cannam@1
|
14 files (the "Software"), to deal in the Software without
|
cannam@1
|
15 restriction, including without limitation the rights to use, copy,
|
cannam@1
|
16 modify, merge, publish, distribute, sublicense, and/or sell copies
|
cannam@1
|
17 of the Software, and to permit persons to whom the Software is
|
cannam@1
|
18 furnished to do so, subject to the following conditions:
|
cannam@1
|
19
|
cannam@1
|
20 The above copyright notice and this permission notice shall be
|
cannam@1
|
21 included in all copies or substantial portions of the Software.
|
cannam@1
|
22
|
cannam@1
|
23 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
cannam@1
|
24 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
cannam@1
|
25 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
cannam@6
|
26 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR
|
cannam@1
|
27 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
|
cannam@1
|
28 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
cannam@1
|
29 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
cannam@1
|
30
|
cannam@1
|
31 Except as contained in this notice, the names of the Centre for
|
cannam@1
|
32 Digital Music; Queen Mary, University of London; and Chris Cannam
|
cannam@1
|
33 shall not be used in advertising or otherwise to promote the sale,
|
cannam@1
|
34 use or other dealings in this Software without prior written
|
cannam@1
|
35 authorization.
|
cannam@1
|
36 */
|
cannam@1
|
37
|
cannam@16
|
#include "PluginHostAdapter.h"
#include "vamp.h"

#include <iostream>
#include <sndfile.h>

#include "system.h"

#include <cmath>
#include <cstdlib>
#include <cstring>
#include <vector>
|
cannam@19
|
47
|
cannam@16
|
48 using std::cout;
|
cannam@16
|
49 using std::cerr;
|
cannam@16
|
50 using std::endl;
|
cannam@16
|
51 using std::string;
|
cannam@16
|
52
|
cannam@16
|
53 void printFeatures(int, int, int, Vamp::Plugin::FeatureSet);
|
cannam@16
|
54 void transformInput(float *, size_t);
|
cannam@16
|
55 void fft(unsigned int, bool, double *, double *, double *, double *);
|
cannam@16
|
56
|
cannam@1
|
/*
    A very simple Vamp plugin host.  Given the name of a plugin
    library (optionally followed by ":" and a plugin name) on the
    command line, it lists the plugins found in that library.  If the
    name of a sound file is also given, it then runs the named plugin
    (or the first plugin in the library if none was named) on the
    sound file, dumping the requested output (the plugin's first
    output unless an output number is given) to stdout.
*/
|
cannam@1
|
63
|
cannam@1
|
64 int main(int argc, char **argv)
|
cannam@1
|
65 {
|
cannam@16
|
66 if (argc < 2 || argc > 4) {
|
cannam@16
|
67 cerr << "Usage: " << argv[0] << " pluginlibrary.so[:plugin] [file.wav] [outputno]" << endl;
|
cannam@1
|
68 return 2;
|
cannam@1
|
69 }
|
cannam@1
|
70
|
cannam@16
|
71 cerr << endl << argv[0] << ": Running..." << endl;
|
cannam@1
|
72
|
cannam@16
|
73 string soname = argv[1];
|
cannam@16
|
74 string plugname = "";
|
cannam@16
|
75 string wavname;
|
cannam@16
|
76 if (argc >= 3) wavname = argv[2];
|
cannam@16
|
77
|
cannam@16
|
78 if (soname.find(":") >= 0) {
|
cannam@16
|
79 plugname = soname.substr(soname.find(":") + 1);
|
cannam@16
|
80 soname = soname.substr(0, soname.find(":"));
|
cannam@16
|
81 }
|
cannam@1
|
82
|
cannam@1
|
83 void *libraryHandle = DLOPEN(soname, RTLD_LAZY);
|
cannam@1
|
84
|
cannam@1
|
85 if (!libraryHandle) {
|
cannam@16
|
86 cerr << argv[0] << ": Failed to open plugin library "
|
cannam@16
|
87 << soname << ": " << DLERROR() << endl;
|
cannam@1
|
88 return 1;
|
cannam@1
|
89 }
|
cannam@1
|
90
|
cannam@16
|
91 cerr << argv[0] << ": Opened plugin library " << soname << endl;
|
cannam@1
|
92
|
cannam@1
|
93 VampGetPluginDescriptorFunction fn = (VampGetPluginDescriptorFunction)
|
cannam@1
|
94 DLSYM(libraryHandle, "vampGetPluginDescriptor");
|
cannam@1
|
95
|
cannam@1
|
96 if (!fn) {
|
cannam@16
|
97 cerr << argv[0] << ": No Vamp descriptor function in library "
|
cannam@16
|
98 << soname << endl;
|
cannam@1
|
99 DLCLOSE(libraryHandle);
|
cannam@1
|
100 return 1;
|
cannam@1
|
101 }
|
cannam@1
|
102
|
cannam@16
|
103 cerr << argv[0] << ": Found plugin descriptor function" << endl;
|
cannam@1
|
104
|
cannam@1
|
105 int index = 0;
|
cannam@16
|
106 int plugnumber = -1;
|
cannam@1
|
107 const VampPluginDescriptor *descriptor = 0;
|
cannam@1
|
108
|
cannam@1
|
109 while ((descriptor = fn(index))) {
|
cannam@1
|
110
|
cannam@16
|
111 Vamp::PluginHostAdapter plugin(descriptor, 48000);
|
cannam@16
|
112 cerr << argv[0] << ": Plugin " << (index+1)
|
cannam@16
|
113 << " is \"" << plugin.getName() << "\"" << endl;
|
cannam@16
|
114
|
cannam@16
|
115 if (plugin.getName() == plugname) plugnumber = index;
|
cannam@1
|
116
|
cannam@1
|
117 ++index;
|
cannam@1
|
118 }
|
cannam@1
|
119
|
cannam@16
|
120 cerr << argv[0] << ": Done\n" << endl;
|
cannam@16
|
121
|
cannam@16
|
122 if (wavname == "") {
|
cannam@16
|
123 DLCLOSE(libraryHandle);
|
cannam@16
|
124 return 0;
|
cannam@16
|
125 }
|
cannam@16
|
126
|
cannam@16
|
127 if (plugnumber < 0) {
|
cannam@16
|
128 if (plugname != "") {
|
cannam@16
|
129 cerr << "ERROR: No such plugin as " << plugname << " in library"
|
cannam@16
|
130 << endl;
|
cannam@16
|
131 DLCLOSE(libraryHandle);
|
cannam@16
|
132 return 0;
|
cannam@16
|
133 } else {
|
cannam@16
|
134 plugnumber = 0;
|
cannam@16
|
135 }
|
cannam@16
|
136 }
|
cannam@16
|
137
|
cannam@16
|
138 descriptor = fn(plugnumber);
|
cannam@16
|
139 if (!descriptor) {
|
cannam@16
|
140 DLCLOSE(libraryHandle);
|
cannam@16
|
141 return 0;
|
cannam@16
|
142 }
|
cannam@16
|
143
|
cannam@16
|
144 SNDFILE *sndfile;
|
cannam@16
|
145 SF_INFO sfinfo;
|
cannam@16
|
146 memset(&sfinfo, 0, sizeof(SF_INFO));
|
cannam@16
|
147
|
cannam@16
|
148 sndfile = sf_open(wavname.c_str(), SFM_READ, &sfinfo);
|
cannam@16
|
149 if (!sndfile) {
|
cannam@16
|
150 cerr << "ERROR: Failed to open input file \"" << wavname << "\": "
|
cannam@16
|
151 << sf_strerror(sndfile) << endl;
|
cannam@16
|
152 DLCLOSE(libraryHandle);
|
cannam@16
|
153 return 1;
|
cannam@16
|
154 }
|
cannam@16
|
155
|
cannam@16
|
156 Vamp::PluginHostAdapter *plugin =
|
cannam@16
|
157 new Vamp::PluginHostAdapter(descriptor, sfinfo.samplerate);
|
cannam@16
|
158
|
cannam@16
|
159 cerr << "Running " << plugin->getName() << "..." << endl;
|
cannam@16
|
160
|
cannam@16
|
161 int blockSize = plugin->getPreferredBlockSize();
|
cannam@16
|
162 int stepSize = plugin->getPreferredStepSize();
|
cannam@16
|
163
|
cannam@16
|
164 cerr << "Preferred block size = " << blockSize << ", step size = "
|
cannam@16
|
165 << stepSize << endl;
|
cannam@16
|
166
|
cannam@16
|
167 if (blockSize == 0) blockSize = 1024;
|
cannam@16
|
168 if (stepSize == 0) stepSize = blockSize;
|
cannam@16
|
169
|
cannam@16
|
170 int channels = sfinfo.channels;
|
cannam@16
|
171
|
cannam@16
|
172 float *filebuf = new float[blockSize * channels];
|
cannam@16
|
173 float **plugbuf = new float*[channels];
|
cannam@16
|
174 for (int c = 0; c < channels; ++c) plugbuf[c] = new float[blockSize];
|
cannam@16
|
175
|
cannam@16
|
176 cerr << "Using block size = " << blockSize << ", step size = "
|
cannam@16
|
177 << stepSize << endl;
|
cannam@16
|
178
|
cannam@16
|
179 int minch = plugin->getMinChannelCount();
|
cannam@16
|
180 int maxch = plugin->getMaxChannelCount();
|
cannam@16
|
181 cerr << "Plugin accepts " << minch << " -> " << maxch << " channel(s)" << endl;
|
cannam@16
|
182
|
cannam@16
|
183 Vamp::Plugin::OutputList outputs = plugin->getOutputDescriptors();
|
cannam@16
|
184 Vamp::Plugin::OutputDescriptor od;
|
cannam@16
|
185
|
cannam@16
|
186 int output = 0;
|
cannam@16
|
187 if (argc == 4) output = atoi(argv[3]);
|
cannam@16
|
188
|
cannam@16
|
189 bool mix = false;
|
cannam@16
|
190
|
cannam@16
|
191 if (minch > channels || maxch < channels) {
|
cannam@16
|
192 if (minch == 1) {
|
cannam@16
|
193 cerr << "WARNING: Sound file has " << channels << " channels, mixing down to 1" << endl;
|
cannam@16
|
194 mix = true;
|
cannam@16
|
195 channels = 1;
|
cannam@16
|
196 } else {
|
cannam@16
|
197 cerr << "ERROR: Sound file has " << channels << " channels, out of range for plugin" << endl;
|
cannam@16
|
198 goto done;
|
cannam@16
|
199 }
|
cannam@16
|
200 }
|
cannam@16
|
201
|
cannam@16
|
202 if (outputs.empty()) {
|
cannam@16
|
203 cerr << "Plugin has no outputs!" << endl;
|
cannam@16
|
204 goto done;
|
cannam@16
|
205 }
|
cannam@16
|
206
|
cannam@16
|
207 if (int(outputs.size()) <= output) {
|
cannam@16
|
208 cerr << "Output " << output << " requested, but plugin has only " << outputs.size() << " output(s)" << endl;
|
cannam@16
|
209 goto done;
|
cannam@16
|
210 }
|
cannam@16
|
211
|
cannam@16
|
212 od = outputs[output];
|
cannam@16
|
213 cerr << "Output is " << od.name << endl;
|
cannam@16
|
214
|
cannam@16
|
215 plugin->initialise(channels, stepSize, blockSize);
|
cannam@16
|
216
|
cannam@16
|
217 for (size_t i = 0; i < sfinfo.frames; i += stepSize) {
|
cannam@16
|
218
|
cannam@16
|
219 int count;
|
cannam@16
|
220
|
cannam@16
|
221 if (sf_seek(sndfile, i, SEEK_SET) < 0) {
|
cannam@16
|
222 cerr << "ERROR: sf_seek failed: " << sf_strerror(sndfile) << endl;
|
cannam@16
|
223 break;
|
cannam@16
|
224 }
|
cannam@16
|
225
|
cannam@16
|
226 if ((count = sf_readf_float(sndfile, filebuf, blockSize)) < 0) {
|
cannam@16
|
227 cerr << "ERROR: sf_readf_float failed: " << sf_strerror(sndfile) << endl;
|
cannam@16
|
228 break;
|
cannam@16
|
229 }
|
cannam@16
|
230
|
cannam@16
|
231 for (int c = 0; c < channels; ++c) {
|
cannam@16
|
232 for (int j = 0; j < blockSize; ++j) {
|
cannam@16
|
233 plugbuf[c][j] = 0.0f;
|
cannam@16
|
234 }
|
cannam@16
|
235 }
|
cannam@16
|
236
|
cannam@16
|
237 for (int c = 0; c < sfinfo.channels; ++c) {
|
cannam@16
|
238 int tc = c;
|
cannam@16
|
239 if (mix) tc = 0;
|
cannam@16
|
240 for (int j = 0; j < blockSize && j < count; ++j) {
|
cannam@16
|
241 plugbuf[tc][j] += filebuf[j * channels + c];
|
cannam@16
|
242 }
|
cannam@16
|
243
|
cannam@16
|
244 if (plugin->getInputDomain() == Vamp::Plugin::FrequencyDomain) {
|
cannam@16
|
245 transformInput(plugbuf[tc], blockSize);
|
cannam@16
|
246 }
|
cannam@16
|
247 }
|
cannam@16
|
248
|
cannam@16
|
249 printFeatures
|
cannam@16
|
250 (i, sfinfo.samplerate, output, plugin->process
|
cannam@16
|
251 (plugbuf, Vamp::RealTime::frame2RealTime(i, sfinfo.samplerate)));
|
cannam@16
|
252 }
|
cannam@16
|
253
|
cannam@16
|
254 printFeatures(sfinfo.frames, sfinfo.samplerate, output,
|
cannam@16
|
255 plugin->getRemainingFeatures());
|
cannam@16
|
256
|
cannam@16
|
257 done:
|
cannam@16
|
258 delete plugin;
|
cannam@1
|
259
|
cannam@1
|
260 DLCLOSE(libraryHandle);
|
cannam@16
|
261 sf_close(sndfile);
|
cannam@1
|
262 return 0;
|
cannam@1
|
263 }
|
cannam@1
|
264
|
cannam@16
|
265 void
|
cannam@16
|
266 printFeatures(int frame, int sr, int output, Vamp::Plugin::FeatureSet features)
|
cannam@16
|
267 {
|
cannam@16
|
268 for (unsigned int i = 0; i < features[output].size(); ++i) {
|
cannam@16
|
269 Vamp::RealTime rt = Vamp::RealTime::frame2RealTime(frame, sr);
|
cannam@16
|
270 if (features[output][i].hasTimestamp) {
|
cannam@16
|
271 rt = features[output][i].timestamp;
|
cannam@16
|
272 }
|
cannam@16
|
273 cout << rt.toString() << ":";
|
cannam@16
|
274 for (unsigned int j = 0; j < features[output][i].values.size(); ++j) {
|
cannam@16
|
275 cout << " " << features[output][i].values[j];
|
cannam@16
|
276 }
|
cannam@16
|
277 cout << endl;
|
cannam@16
|
278 }
|
cannam@16
|
279 }
|
cannam@16
|
280
|
cannam@16
|
281 void
|
cannam@16
|
282 transformInput(float *buffer, size_t size)
|
cannam@16
|
283 {
|
cannam@16
|
284 double *inbuf = new double[size * 2];
|
cannam@16
|
285 double *outbuf = new double[size * 2];
|
cannam@16
|
286
|
cannam@16
|
287 // Copy across with Hanning window
|
cannam@16
|
288 for (size_t i = 0; i < size; ++i) {
|
cannam@16
|
289 inbuf[i] = double(buffer[i]) * (0.50 - 0.50 * cos(2 * M_PI * i / size));
|
cannam@16
|
290 inbuf[i + size] = 0.0;
|
cannam@16
|
291 }
|
cannam@16
|
292
|
cannam@16
|
293 for (size_t i = 0; i < size/2; ++i) {
|
cannam@16
|
294 double temp = inbuf[i];
|
cannam@16
|
295 inbuf[i] = inbuf[i + size/2];
|
cannam@16
|
296 inbuf[i + size/2] = temp;
|
cannam@16
|
297 }
|
cannam@16
|
298
|
cannam@16
|
299 fft(size, false, inbuf, inbuf + size, outbuf, outbuf + size);
|
cannam@16
|
300
|
cannam@16
|
301 for (size_t i = 0; i < size/2; ++i) {
|
cannam@16
|
302 buffer[i * 2] = outbuf[i];
|
cannam@16
|
303 buffer[i * 2 + 1] = outbuf[i + size];
|
cannam@16
|
304 }
|
cannam@16
|
305
|
cannam@16
|
306 delete inbuf;
|
cannam@16
|
307 delete outbuf;
|
cannam@16
|
308 }
|
cannam@16
|
309
|
cannam@16
|
/*
    Radix-2 complex FFT of "n" points.

    ri / ii are the real and imaginary input arrays; ii may be null,
    in which case the imaginary input is taken as all zeros.  ro / io
    receive the real and imaginary output.  If "inverse" is true the
    inverse transform is computed and the result is divided by n.

    The function returns without writing anything if ri, ro or io is
    null, or if n is less than 2 or not a power of two.

    The bit-reversal table is kept in function-local statics and
    rebuilt only when n differs from the previous call.
*/
void
fft(unsigned int n, bool inverse, double *ri, double *ii, double *ro, double *io)
{
    const bool haveBuffers = (ri && ro && io);
    if (!haveBuffers) return;

    const bool powerOfTwo = (n >= 2) && ((n & (n-1)) == 0);
    if (!powerOfTwo) return;

    const double angle = inverse ? -(2.0 * M_PI) : (2.0 * M_PI);

    // n is a power of two, so the position of its single set bit is
    // the number of index bits to reverse.
    unsigned int bits = 0;
    while (!(n & (1 << bits))) ++bits;

    static unsigned int tableSize = 0;
    static int *table = 0;

    if (tableSize != n) {

        delete[] table;
        table = new int[n];

        for (unsigned int index = 0; index < n; ++index) {

            unsigned int remaining = index;
            unsigned int reversed = 0;

            for (unsigned int b = 0; b < bits; ++b) {
                reversed = (reversed << 1) | (remaining & 1);
                remaining >>= 1;
            }

            table[index] = reversed;
        }

        tableSize = n;
    }

    // Scatter the input into bit-reversed order in the output arrays.
    for (unsigned int index = 0; index < n; ++index) {
        const int target = table[index];
        ro[target] = ri[index];
        io[target] = ii ? ii[index] : 0.0;
    }

    // Butterfly passes: "half" is the distance between the two
    // elements of a butterfly, "span" the size of the sub-transform
    // being assembled in this pass.
    unsigned int half = 1;
    unsigned int span = 2;

    while (span <= n) {

        const double delta = angle / static_cast<double>(span);
        const double sm2 = -sin(-2 * delta);
        const double sm1 = -sin(-delta);
        const double cm2 = cos(-2 * delta);
        const double cm1 = cos(-delta);
        const double w = 2 * cm1;

        for (unsigned int base = 0; base < n; base += span) {

            // The twiddle factor's cosine and sine are advanced by a
            // two-term recurrence seeded from the values above.
            double cosPrev2 = cm2;
            double cosPrev1 = cm1;
            double sinPrev2 = sm2;
            double sinPrev1 = sm1;

            for (unsigned int offset = 0; offset < half; ++offset) {

                const double c = w * cosPrev1 - cosPrev2;
                cosPrev2 = cosPrev1;
                cosPrev1 = c;

                const double s = w * sinPrev1 - sinPrev2;
                sinPrev2 = sinPrev1;
                sinPrev1 = s;

                const unsigned int lower = base + offset;
                const unsigned int upper = lower + half;

                const double tr = c * ro[upper] - s * io[upper];
                const double ti = c * io[upper] + s * ro[upper];

                ro[upper] = ro[lower] - tr;
                io[upper] = io[lower] - ti;

                ro[lower] += tr;
                io[lower] += ti;
            }
        }

        half = span;
        span <<= 1;
    }

    if (inverse) {

        const double denom = static_cast<double>(n);

        for (unsigned int index = 0; index < n; ++index) {
            ro[index] /= denom;
            io[index] /= denom;
        }
    }
}
|
cannam@16
|
425
|
cannam@16
|
426
|