c@116
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
c@116
|
2 /*
|
c@116
|
3 Constant-Q library
|
c@116
|
4 Copyright (c) 2013-2014 Queen Mary, University of London
|
c@116
|
5
|
c@116
|
6 Permission is hereby granted, free of charge, to any person
|
c@116
|
7 obtaining a copy of this software and associated documentation
|
c@116
|
8 files (the "Software"), to deal in the Software without
|
c@116
|
9 restriction, including without limitation the rights to use, copy,
|
c@116
|
10 modify, merge, publish, distribute, sublicense, and/or sell copies
|
c@116
|
11 of the Software, and to permit persons to whom the Software is
|
c@116
|
12 furnished to do so, subject to the following conditions:
|
c@116
|
13
|
c@116
|
14 The above copyright notice and this permission notice shall be
|
c@116
|
15 included in all copies or substantial portions of the Software.
|
c@116
|
16
|
c@116
|
17 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
c@116
|
18 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
c@116
|
19 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
c@116
|
20 NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY
|
c@116
|
21 CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
|
c@116
|
22 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
c@116
|
23 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
c@116
|
24
|
c@116
|
25 Except as contained in this notice, the names of the Centre for
|
c@116
|
26 Digital Music; Queen Mary, University of London; and Chris Cannam
|
c@116
|
27 shall not be used in advertising or otherwise to promote the sale,
|
c@116
|
28 use or other dealings in this Software without prior written
|
c@116
|
29 authorization.
|
c@116
|
30 */
|
c@116
|
31
|
c@116
|
32 #include "ConstantQ.h"
|
c@116
|
33
|
c@116
|
34 #include "CQKernel.h"
|
c@116
|
35
|
c@121
|
36 #include "dsp/Resampler.h"
|
c@121
|
37 #include "dsp/MathUtilities.h"
|
c@121
|
38 #include "dsp/FFT.h"
|
c@116
|
39
|
c@116
|
40 #include <algorithm>
|
c@116
|
41 #include <iostream>
|
c@116
|
42 #include <stdexcept>
|
c@116
|
43
|
c@164
|
44 #include <cmath>
|
c@164
|
45
|
c@116
|
46 using std::vector;
|
c@116
|
47 using std::cerr;
|
c@116
|
48 using std::endl;
|
c@116
|
49
|
c@116
|
50 //#define DEBUG_CQ 1
|
c@116
|
51
|
c@127
|
52 ConstantQ::ConstantQ(CQParameters params) :
|
c@127
|
53 m_inparams(params),
|
c@127
|
54 m_sampleRate(params.sampleRate),
|
c@127
|
55 m_maxFrequency(params.maxFrequency),
|
c@127
|
56 m_minFrequency(params.minFrequency),
|
c@127
|
57 m_binsPerOctave(params.binsPerOctave),
|
c@156
|
58 m_kernel(0),
|
c@116
|
59 m_fft(0)
|
c@116
|
60 {
|
c@127
|
61 if (m_minFrequency <= 0.0 || m_maxFrequency <= 0.0) {
|
c@116
|
62 throw std::invalid_argument("Frequency extents must be positive");
|
c@116
|
63 }
|
c@116
|
64
|
c@116
|
65 initialise();
|
c@116
|
66 }
|
c@116
|
67
|
c@116
|
68 ConstantQ::~ConstantQ()
|
c@116
|
69 {
|
c@116
|
70 delete m_fft;
|
c@116
|
71 for (int i = 0; i < (int)m_decimators.size(); ++i) {
|
c@116
|
72 delete m_decimators[i];
|
c@116
|
73 }
|
c@116
|
74 delete m_kernel;
|
c@116
|
75 }
|
c@116
|
76
|
c@116
|
77 double
|
c@116
|
78 ConstantQ::getMinFrequency() const
|
c@116
|
79 {
|
c@116
|
80 return m_p.minFrequency / pow(2.0, m_octaves - 1);
|
c@116
|
81 }
|
c@116
|
82
|
c@116
|
83 double
|
c@145
|
84 ConstantQ::getBinFrequency(double bin) const
|
c@116
|
85 {
|
c@137
|
86 // our bins are returned in high->low order
|
c@137
|
87 bin = (getBinsPerOctave() * getOctaves()) - bin - 1;
|
c@145
|
88 return getMinFrequency() * pow(2, (bin / getBinsPerOctave()));
|
c@116
|
89 }
|
c@116
|
90
|
c@116
|
91 void
|
c@116
|
92 ConstantQ::initialise()
|
c@116
|
93 {
|
c@164
|
94 m_octaves = int(ceil(log(m_maxFrequency / m_minFrequency) / log(2)));
|
c@150
|
95
|
c@150
|
96 if (m_octaves < 1) {
|
c@150
|
97 m_kernel = 0; // incidentally causing isValid() to return false
|
c@150
|
98 return;
|
c@150
|
99 }
|
c@150
|
100
|
c@127
|
101 m_kernel = new CQKernel(m_inparams);
|
c@116
|
102 m_p = m_kernel->getProperties();
|
c@116
|
103
|
c@147
|
104 if (!m_kernel->isValid()) {
|
c@147
|
105 return;
|
c@147
|
106 }
|
c@147
|
107
|
c@116
|
108 // Use exact powers of two for resampling rates. They don't have
|
c@116
|
109 // to be related to our actual samplerate: the resampler only
|
c@116
|
110 // cares about the ratio, but it only accepts integer source and
|
c@116
|
111 // target rates, and if we start from the actual samplerate we
|
c@116
|
112 // risk getting non-integer rates for lower octaves
|
c@116
|
113
|
c@116
|
114 int sourceRate = pow(2, m_octaves);
|
c@116
|
115 vector<int> latencies;
|
c@116
|
116
|
c@116
|
117 // top octave, no resampling
|
c@116
|
118 latencies.push_back(0);
|
c@116
|
119 m_decimators.push_back(0);
|
c@116
|
120
|
c@116
|
121 for (int i = 1; i < m_octaves; ++i) {
|
c@116
|
122
|
c@116
|
123 int factor = pow(2, i);
|
c@116
|
124
|
c@176
|
125 Resampler *r;
|
c@176
|
126
|
c@176
|
127 if (m_inparams.decimator == CQParameters::BetterDecimator) {
|
c@176
|
128 r = new Resampler
|
c@176
|
129 (sourceRate, sourceRate / factor, 50, 0.05);
|
c@176
|
130 } else {
|
c@176
|
131 r = new Resampler
|
c@176
|
132 (sourceRate, sourceRate / factor, 25, 0.3);
|
c@176
|
133 }
|
c@116
|
134
|
c@116
|
135 #ifdef DEBUG_CQ
|
c@116
|
136 cerr << "forward: octave " << i << ": resample from " << sourceRate << " to " << sourceRate / factor << endl;
|
c@116
|
137 #endif
|
c@116
|
138
|
c@116
|
139 // We need to adapt the latencies so as to get the first input
|
c@116
|
140 // sample to be aligned, in time, at the decimator output
|
c@116
|
141 // across all octaves.
|
c@116
|
142 //
|
c@116
|
143 // Our decimator uses a linear phase filter, but being causal
|
c@116
|
144 // it is not zero phase: it has a latency that depends on the
|
c@116
|
145 // decimation factor. Those latencies have been calculated
|
c@116
|
146 // per-octave and are available to us in the latencies
|
c@116
|
147 // array. Left to its own devices, the first input sample will
|
c@116
|
148 // appear at output sample 0 in the highest octave (where no
|
c@116
|
149 // decimation is needed), sample number latencies[1] in the
|
c@116
|
150 // next octave down, latencies[2] in the next one, etc. We get
|
c@116
|
151 // to apply some artificial per-octave latency after the
|
c@116
|
152 // decimator in the processing chain, in order to compensate
|
c@116
|
153 // for the differing latencies associated with different
|
c@116
|
154 // decimation factors. How much should we insert?
|
c@116
|
155 //
|
c@116
|
156 // The outputs of the decimators are at different rates (in
|
c@116
|
157 // terms of the relation between clock time and samples) and
|
c@116
|
158 // we want them aligned in terms of time. So, for example, a
|
c@116
|
159 // latency of 10 samples with a decimation factor of 2 is
|
c@116
|
160 // equivalent to a latency of 20 with no decimation -- they
|
c@116
|
161 // both result in the first output sample happening at the
|
c@116
|
162 // same equivalent time in milliseconds.
|
c@116
|
163 //
|
c@116
|
164 // So here we record the latency added by the decimator, in
|
c@116
|
165 // terms of the sample rate of the undecimated signal. Then we
|
c@116
|
166 // use that to compensate in a moment, when we've discovered
|
c@116
|
167 // what the longest latency across all octaves is.
|
c@116
|
168
|
c@116
|
169 latencies.push_back(r->getLatency() * factor);
|
c@116
|
170 m_decimators.push_back(r);
|
c@116
|
171 }
|
c@116
|
172
|
c@116
|
173 m_bigBlockSize = m_p.fftSize * pow(2, m_octaves - 1);
|
c@116
|
174
|
c@116
|
175 // Now add in the extra padding and compensate for hops that must
|
c@116
|
176 // be dropped in order to align the atom centres across
|
c@116
|
177 // octaves. Again this is a bit trickier because we are doing it
|
c@116
|
178 // at input rather than output and so must work in per-octave
|
c@116
|
179 // sample rates rather than output blocks
|
c@116
|
180
|
c@116
|
181 int emptyHops = m_p.firstCentre / m_p.atomSpacing;
|
c@116
|
182
|
c@116
|
183 vector<int> drops;
|
c@116
|
184 for (int i = 0; i < m_octaves; ++i) {
|
c@116
|
185 int factor = pow(2, i);
|
c@116
|
186 int dropHops = emptyHops * pow(2, m_octaves - i - 1) - emptyHops;
|
c@116
|
187 int drop = ((dropHops * m_p.fftHop) * factor) / m_p.atomsPerFrame;
|
c@116
|
188 drops.push_back(drop);
|
c@116
|
189 }
|
c@116
|
190
|
c@116
|
191 int maxLatPlusDrop = 0;
|
c@116
|
192 for (int i = 0; i < m_octaves; ++i) {
|
c@116
|
193 int latPlusDrop = latencies[i] + drops[i];
|
c@116
|
194 if (latPlusDrop > maxLatPlusDrop) maxLatPlusDrop = latPlusDrop;
|
c@116
|
195 }
|
c@116
|
196
|
c@116
|
197 int totalLatency = maxLatPlusDrop;
|
c@116
|
198
|
c@116
|
199 int lat0 = totalLatency - latencies[0] - drops[0];
|
c@116
|
200 totalLatency = ceil(double(lat0 / m_p.fftHop) * m_p.fftHop)
|
c@116
|
201 + latencies[0] + drops[0];
|
c@116
|
202
|
c@116
|
203 // We want (totalLatency - latencies[i]) to be a multiple of 2^i
|
c@116
|
204 // for each octave i, so that we do not end up with fractional
|
c@116
|
205 // octave latencies below. In theory this is hard, in practice if
|
c@116
|
206 // we ensure it for the last octave we should be OK.
|
c@116
|
207 double finalOctLat = latencies[m_octaves-1];
|
c@116
|
208 double finalOctFact = pow(2, m_octaves-1);
|
c@116
|
209 totalLatency =
|
c@164
|
210 int(finalOctLat +
|
c@164
|
211 finalOctFact *
|
c@164
|
212 ceil((totalLatency - finalOctLat) / finalOctFact) + .5);
|
c@116
|
213
|
c@116
|
214 #ifdef DEBUG_CQ
|
c@116
|
215 cerr << "total latency = " << totalLatency << endl;
|
c@116
|
216 #endif
|
c@116
|
217
|
c@116
|
218 // Padding as in the reference (will be introduced with the
|
c@116
|
219 // latency compensation in the loop below)
|
c@116
|
220 m_outputLatency = totalLatency + m_bigBlockSize
|
c@116
|
221 - m_p.firstCentre * pow(2, m_octaves-1);
|
c@116
|
222
|
c@116
|
223 #ifdef DEBUG_CQ
|
c@116
|
224 cerr << "m_bigBlockSize = " << m_bigBlockSize << ", firstCentre = "
|
c@116
|
225 << m_p.firstCentre << ", m_octaves = " << m_octaves
|
c@116
|
226 << ", so m_outputLatency = " << m_outputLatency << endl;
|
c@116
|
227 #endif
|
c@116
|
228
|
c@116
|
229 for (int i = 0; i < m_octaves; ++i) {
|
c@116
|
230
|
c@116
|
231 double factor = pow(2, i);
|
c@116
|
232
|
c@116
|
233 // Calculate the difference between the total latency applied
|
c@116
|
234 // across all octaves, and the existing latency due to the
|
c@116
|
235 // decimator for this octave, and then convert it back into
|
c@116
|
236 // the sample rate appropriate for the output latency of this
|
c@116
|
237 // decimator -- including one additional big block of padding
|
c@116
|
238 // (as in the reference).
|
c@116
|
239
|
c@116
|
240 double octaveLatency =
|
c@116
|
241 double(totalLatency - latencies[i] - drops[i]
|
c@116
|
242 + m_bigBlockSize) / factor;
|
c@116
|
243
|
c@116
|
244 #ifdef DEBUG_CQ
|
c@116
|
245 cerr << "octave " << i << ": resampler latency = " << latencies[i]
|
c@116
|
246 << ", drop " << drops[i] << " (/factor = " << drops[i]/factor
|
c@116
|
247 << "), octaveLatency = " << octaveLatency << " -> "
|
c@116
|
248 << int(round(octaveLatency)) << " (diff * factor = "
|
c@116
|
249 << (octaveLatency - round(octaveLatency)) << " * "
|
c@116
|
250 << factor << " = "
|
c@116
|
251 << (octaveLatency - round(octaveLatency)) * factor << ")" << endl;
|
c@116
|
252
|
c@116
|
253 cerr << "double(" << totalLatency << " - "
|
c@116
|
254 << latencies[i] << " - " << drops[i] << " + "
|
c@116
|
255 << m_bigBlockSize << ") / " << factor << " = "
|
c@116
|
256 << octaveLatency << endl;
|
c@116
|
257 #endif
|
c@116
|
258
|
c@116
|
259 m_buffers.push_back
|
c@164
|
260 (RealSequence(int(octaveLatency + 0.5), 0.0));
|
c@116
|
261 }
|
c@116
|
262
|
c@116
|
263 m_fft = new FFTReal(m_p.fftSize);
|
c@116
|
264 }
|
c@116
|
265
|
c@116
|
266 ConstantQ::ComplexBlock
|
c@116
|
267 ConstantQ::process(const RealSequence &td)
|
c@116
|
268 {
|
c@116
|
269 m_buffers[0].insert(m_buffers[0].end(), td.begin(), td.end());
|
c@116
|
270
|
c@116
|
271 for (int i = 1; i < m_octaves; ++i) {
|
c@116
|
272 RealSequence dec = m_decimators[i]->process(td.data(), td.size());
|
c@116
|
273 m_buffers[i].insert(m_buffers[i].end(), dec.begin(), dec.end());
|
c@116
|
274 }
|
c@116
|
275
|
c@116
|
276 ComplexBlock out;
|
c@116
|
277
|
c@116
|
278 while (true) {
|
c@116
|
279
|
c@116
|
280 // We could have quite different remaining sample counts in
|
c@116
|
281 // different octaves, because (apart from the predictable
|
c@116
|
282 // added counts for decimator output on each block) we also
|
c@116
|
283 // have variable additional latency per octave
|
c@116
|
284 bool enough = true;
|
c@116
|
285 for (int i = 0; i < m_octaves; ++i) {
|
c@116
|
286 int required = m_p.fftSize * pow(2, m_octaves - i - 1);
|
c@116
|
287 if ((int)m_buffers[i].size() < required) {
|
c@116
|
288 enough = false;
|
c@116
|
289 }
|
c@116
|
290 }
|
c@116
|
291 if (!enough) break;
|
c@116
|
292
|
c@116
|
293 int base = out.size();
|
c@116
|
294 int totalColumns = pow(2, m_octaves - 1) * m_p.atomsPerFrame;
|
c@116
|
295 for (int i = 0; i < totalColumns; ++i) {
|
c@116
|
296 out.push_back(ComplexColumn());
|
c@116
|
297 }
|
c@116
|
298
|
c@116
|
299 for (int octave = 0; octave < m_octaves; ++octave) {
|
c@116
|
300
|
c@116
|
301 int blocksThisOctave = pow(2, (m_octaves - octave - 1));
|
c@116
|
302
|
c@116
|
303 for (int b = 0; b < blocksThisOctave; ++b) {
|
c@116
|
304 ComplexBlock block = processOctaveBlock(octave);
|
c@116
|
305
|
c@116
|
306 for (int j = 0; j < m_p.atomsPerFrame; ++j) {
|
c@116
|
307
|
c@116
|
308 int target = base +
|
c@116
|
309 (b * (totalColumns / blocksThisOctave) +
|
c@116
|
310 (j * ((totalColumns / blocksThisOctave) /
|
c@116
|
311 m_p.atomsPerFrame)));
|
c@116
|
312
|
c@116
|
313 while (int(out[target].size()) <
|
c@116
|
314 m_p.binsPerOctave * (octave + 1)) {
|
c@116
|
315 out[target].push_back(Complex());
|
c@116
|
316 }
|
c@116
|
317
|
c@116
|
318 for (int i = 0; i < m_p.binsPerOctave; ++i) {
|
c@116
|
319 out[target][m_p.binsPerOctave * octave + i] =
|
c@116
|
320 block[j][m_p.binsPerOctave - i - 1];
|
c@116
|
321 }
|
c@116
|
322 }
|
c@116
|
323 }
|
c@116
|
324 }
|
c@116
|
325 }
|
c@116
|
326
|
c@116
|
327 return out;
|
c@116
|
328 }
|
c@116
|
329
|
c@116
|
330 ConstantQ::ComplexBlock
|
c@116
|
331 ConstantQ::getRemainingOutput()
|
c@116
|
332 {
|
c@116
|
333 // Same as padding added at start, though rounded up
|
c@116
|
334 int pad = ceil(double(m_outputLatency) / m_bigBlockSize) * m_bigBlockSize;
|
c@116
|
335 RealSequence zeros(pad, 0.0);
|
c@116
|
336 return process(zeros);
|
c@116
|
337 }
|
c@116
|
338
|
c@116
|
339 ConstantQ::ComplexBlock
|
c@116
|
340 ConstantQ::processOctaveBlock(int octave)
|
c@116
|
341 {
|
c@116
|
342 RealSequence ro(m_p.fftSize, 0.0);
|
c@116
|
343 RealSequence io(m_p.fftSize, 0.0);
|
c@116
|
344
|
c@116
|
345 m_fft->forward(m_buffers[octave].data(), ro.data(), io.data());
|
c@116
|
346
|
c@177
|
347 m_buffers[octave] = RealSequence(m_buffers[octave].begin() + m_p.fftHop,
|
c@177
|
348 m_buffers[octave].end());
|
c@116
|
349
|
c@177
|
350 ComplexSequence cv(m_p.fftSize);
|
c@116
|
351 for (int i = 0; i < m_p.fftSize; ++i) {
|
c@177
|
352 cv[i] = Complex(ro[i], io[i]);
|
c@116
|
353 }
|
c@116
|
354
|
c@116
|
355 ComplexSequence cqrowvec = m_kernel->processForward(cv);
|
c@116
|
356
|
c@116
|
357 // Reform into a column matrix
|
c@116
|
358 ComplexBlock cqblock;
|
c@116
|
359 for (int j = 0; j < m_p.atomsPerFrame; ++j) {
|
c@116
|
360 cqblock.push_back(ComplexColumn());
|
c@116
|
361 for (int i = 0; i < m_p.binsPerOctave; ++i) {
|
c@116
|
362 cqblock[j].push_back(cqrowvec[i * m_p.atomsPerFrame + j]);
|
c@116
|
363 }
|
c@116
|
364 }
|
c@116
|
365
|
c@116
|
366 return cqblock;
|
c@116
|
367 }
|
c@116
|
368
|
c@116
|
369
|