Mercurial > hg > svcore
comparison data/model/FFTModel.cpp @ 935:f960d67ce842 tonioni
Merge from branch warnfix_no_size_t
author | Chris Cannam |
---|---|
date | Wed, 18 Jun 2014 13:42:01 +0100 |
parents | 59e7fe1b1003 |
children | a8aed8a85e09 |
comparison
equal
deleted
inserted
replaced
925:3efc20c59a94 | 935:f960d67ce842 |
---|---|
29 #endif | 29 #endif |
30 | 30 |
31 FFTModel::FFTModel(const DenseTimeValueModel *model, | 31 FFTModel::FFTModel(const DenseTimeValueModel *model, |
32 int channel, | 32 int channel, |
33 WindowType windowType, | 33 WindowType windowType, |
34 size_t windowSize, | 34 int windowSize, |
35 size_t windowIncrement, | 35 int windowIncrement, |
36 size_t fftSize, | 36 int fftSize, |
37 bool polar, | 37 bool polar, |
38 StorageAdviser::Criteria criteria, | 38 StorageAdviser::Criteria criteria, |
39 size_t fillFromColumn) : | 39 int fillFromColumn) : |
40 //!!! ZoomConstraint! | 40 //!!! ZoomConstraint! |
41 m_server(0), | 41 m_server(0), |
42 m_xshift(0), | 42 m_xshift(0), |
43 m_yshift(0) | 43 m_yshift(0) |
44 { | 44 { |
54 criteria, | 54 criteria, |
55 fillFromColumn); | 55 fillFromColumn); |
56 | 56 |
57 if (!m_server) return; // caller should check isOK() | 57 if (!m_server) return; // caller should check isOK() |
58 | 58 |
59 size_t xratio = windowIncrement / m_server->getWindowIncrement(); | 59 int xratio = windowIncrement / m_server->getWindowIncrement(); |
60 size_t yratio = m_server->getFFTSize() / fftSize; | 60 int yratio = m_server->getFFTSize() / fftSize; |
61 | 61 |
62 while (xratio > 1) { | 62 while (xratio > 1) { |
63 if (xratio & 0x1) { | 63 if (xratio & 0x1) { |
64 cerr << "ERROR: FFTModel: Window increment ratio " | 64 cerr << "ERROR: FFTModel: Window increment ratio " |
65 << windowIncrement << " / " | 65 << windowIncrement << " / " |
103 | 103 |
104 FFTDataServer * | 104 FFTDataServer * |
105 FFTModel::getServer(const DenseTimeValueModel *model, | 105 FFTModel::getServer(const DenseTimeValueModel *model, |
106 int channel, | 106 int channel, |
107 WindowType windowType, | 107 WindowType windowType, |
108 size_t windowSize, | 108 int windowSize, |
109 size_t windowIncrement, | 109 int windowIncrement, |
110 size_t fftSize, | 110 int fftSize, |
111 bool polar, | 111 bool polar, |
112 StorageAdviser::Criteria criteria, | 112 StorageAdviser::Criteria criteria, |
113 size_t fillFromColumn) | 113 int fillFromColumn) |
114 { | 114 { |
115 // Obviously, an FFT model of channel C (where C != -1) of an | 115 // Obviously, an FFT model of channel C (where C != -1) of an |
116 // aggregate model is the same as the FFT model of the appropriate | 116 // aggregate model is the same as the FFT model of the appropriate |
117 // channel of whichever model that aggregate channel is drawn | 117 // channel of whichever model that aggregate channel is drawn |
118 // from. We should use that model here, in case we already have | 118 // from. We should use that model here, in case we already have |
157 polar, | 157 polar, |
158 criteria, | 158 criteria, |
159 fillFromColumn); | 159 fillFromColumn); |
160 } | 160 } |
161 | 161 |
162 size_t | 162 int |
163 FFTModel::getSampleRate() const | 163 FFTModel::getSampleRate() const |
164 { | 164 { |
165 return isOK() ? m_server->getModel()->getSampleRate() : 0; | 165 return isOK() ? m_server->getModel()->getSampleRate() : 0; |
166 } | 166 } |
167 | 167 |
168 FFTModel::Column | 168 FFTModel::Column |
169 FFTModel::getColumn(size_t x) const | 169 FFTModel::getColumn(int x) const |
170 { | 170 { |
171 Profiler profiler("FFTModel::getColumn", false); | 171 Profiler profiler("FFTModel::getColumn", false); |
172 | 172 |
173 Column result; | 173 Column result; |
174 | 174 |
175 result.clear(); | 175 result.clear(); |
176 size_t h = getHeight(); | 176 int h = getHeight(); |
177 result.reserve(h); | 177 result.reserve(h); |
178 | 178 |
179 #ifdef __GNUC__ | 179 #ifdef __GNUC__ |
180 float magnitudes[h]; | 180 float magnitudes[h]; |
181 #else | 181 #else |
182 float *magnitudes = (float *)alloca(h * sizeof(float)); | 182 float *magnitudes = (float *)alloca(h * sizeof(float)); |
183 #endif | 183 #endif |
184 | 184 |
185 if (m_server->getMagnitudesAt(x << m_xshift, magnitudes)) { | 185 if (m_server->getMagnitudesAt(x << m_xshift, magnitudes)) { |
186 | 186 |
187 for (size_t y = 0; y < h; ++y) { | 187 for (int y = 0; y < h; ++y) { |
188 result.push_back(magnitudes[y]); | 188 result.push_back(magnitudes[y]); |
189 } | 189 } |
190 | 190 |
191 } else { | 191 } else { |
192 for (size_t i = 0; i < h; ++i) result.push_back(0.f); | 192 for (int i = 0; i < h; ++i) result.push_back(0.f); |
193 } | 193 } |
194 | 194 |
195 return result; | 195 return result; |
196 } | 196 } |
197 | 197 |
198 QString | 198 QString |
199 FFTModel::getBinName(size_t n) const | 199 FFTModel::getBinName(int n) const |
200 { | 200 { |
201 size_t sr = getSampleRate(); | 201 int sr = getSampleRate(); |
202 if (!sr) return ""; | 202 if (!sr) return ""; |
203 QString name = tr("%1 Hz").arg((n * sr) / ((getHeight()-1) * 2)); | 203 QString name = tr("%1 Hz").arg((n * sr) / ((getHeight()-1) * 2)); |
204 return name; | 204 return name; |
205 } | 205 } |
206 | 206 |
207 bool | 207 bool |
208 FFTModel::estimateStableFrequency(size_t x, size_t y, float &frequency) | 208 FFTModel::estimateStableFrequency(int x, int y, float &frequency) |
209 { | 209 { |
210 if (!isOK()) return false; | 210 if (!isOK()) return false; |
211 | 211 |
212 size_t sampleRate = m_server->getModel()->getSampleRate(); | 212 int sampleRate = m_server->getModel()->getSampleRate(); |
213 | 213 |
214 size_t fftSize = m_server->getFFTSize() >> m_yshift; | 214 int fftSize = m_server->getFFTSize() >> m_yshift; |
215 frequency = (float(y) * sampleRate) / fftSize; | 215 frequency = (float(y) * sampleRate) / fftSize; |
216 | 216 |
217 if (x+1 >= getWidth()) return false; | 217 if (x+1 >= getWidth()) return false; |
218 | 218 |
219 // At frequency f, a phase shift of 2pi (one cycle) happens in 1/f sec. | 219 // At frequency f, a phase shift of 2pi (one cycle) happens in 1/f sec. |
226 // = 2pi * (h * b) / w. | 226 // = 2pi * (h * b) / w. |
227 | 227 |
228 float oldPhase = getPhaseAt(x, y); | 228 float oldPhase = getPhaseAt(x, y); |
229 float newPhase = getPhaseAt(x+1, y); | 229 float newPhase = getPhaseAt(x+1, y); |
230 | 230 |
231 size_t incr = getResolution(); | 231 int incr = getResolution(); |
232 | 232 |
233 float expectedPhase = oldPhase + (2.0 * M_PI * y * incr) / fftSize; | 233 float expectedPhase = oldPhase + (2.0 * M_PI * y * incr) / fftSize; |
234 | 234 |
235 float phaseError = princargf(newPhase - expectedPhase); | 235 float phaseError = princargf(newPhase - expectedPhase); |
236 | 236 |
245 | 245 |
246 return true; | 246 return true; |
247 } | 247 } |
248 | 248 |
249 FFTModel::PeakLocationSet | 249 FFTModel::PeakLocationSet |
250 FFTModel::getPeaks(PeakPickType type, size_t x, size_t ymin, size_t ymax) | 250 FFTModel::getPeaks(PeakPickType type, int x, int ymin, int ymax) |
251 { | 251 { |
252 Profiler profiler("FFTModel::getPeaks"); | 252 Profiler profiler("FFTModel::getPeaks"); |
253 | 253 |
254 FFTModel::PeakLocationSet peaks; | 254 FFTModel::PeakLocationSet peaks; |
255 if (!isOK()) return peaks; | 255 if (!isOK()) return peaks; |
268 float values[n]; | 268 float values[n]; |
269 #else | 269 #else |
270 float *values = (float *)alloca(n * sizeof(float)); | 270 float *values = (float *)alloca(n * sizeof(float)); |
271 #endif | 271 #endif |
272 getMagnitudesAt(x, values, minbin, maxbin - minbin + 1); | 272 getMagnitudesAt(x, values, minbin, maxbin - minbin + 1); |
273 for (size_t bin = ymin; bin <= ymax; ++bin) { | 273 for (int bin = ymin; bin <= ymax; ++bin) { |
274 if (bin == minbin || bin == maxbin) continue; | 274 if (bin == minbin || bin == maxbin) continue; |
275 if (values[bin - minbin] > values[bin - minbin - 1] && | 275 if (values[bin - minbin] > values[bin - minbin - 1] && |
276 values[bin - minbin] > values[bin - minbin + 1]) { | 276 values[bin - minbin] > values[bin - minbin + 1]) { |
277 peaks.insert(bin); | 277 peaks.insert(bin); |
278 } | 278 } |
289 // For peak picking we use a moving median window, picking the | 289 // For peak picking we use a moving median window, picking the |
290 // highest value within each continuous region of values that | 290 // highest value within each continuous region of values that |
291 // exceed the median. For pitch adaptivity, we adjust the window | 291 // exceed the median. For pitch adaptivity, we adjust the window |
292 // size to a roughly constant pitch range (about four tones). | 292 // size to a roughly constant pitch range (about four tones). |
293 | 293 |
294 size_t sampleRate = getSampleRate(); | 294 int sampleRate = getSampleRate(); |
295 | 295 |
296 std::deque<float> window; | 296 std::deque<float> window; |
297 std::vector<size_t> inrange; | 297 std::vector<int> inrange; |
298 float dist = 0.5; | 298 float dist = 0.5; |
299 | 299 |
300 size_t medianWinSize = getPeakPickWindowSize(type, sampleRate, ymin, dist); | 300 int medianWinSize = getPeakPickWindowSize(type, sampleRate, ymin, dist); |
301 size_t halfWin = medianWinSize/2; | 301 int halfWin = medianWinSize/2; |
302 | 302 |
303 size_t binmin; | 303 int binmin; |
304 if (ymin > halfWin) binmin = ymin - halfWin; | 304 if (ymin > halfWin) binmin = ymin - halfWin; |
305 else binmin = 0; | 305 else binmin = 0; |
306 | 306 |
307 size_t binmax; | 307 int binmax; |
308 if (ymax + halfWin < values.size()) binmax = ymax + halfWin; | 308 if (ymax + halfWin < values.size()) binmax = ymax + halfWin; |
309 else binmax = values.size()-1; | 309 else binmax = values.size()-1; |
310 | 310 |
311 size_t prevcentre = 0; | 311 int prevcentre = 0; |
312 | 312 |
313 for (size_t bin = binmin; bin <= binmax; ++bin) { | 313 for (int bin = binmin; bin <= binmax; ++bin) { |
314 | 314 |
315 float value = values[bin]; | 315 float value = values[bin]; |
316 | 316 |
317 window.push_back(value); | 317 window.push_back(value); |
318 | 318 |
319 // so-called median will actually be the dist*100'th percentile | 319 // so-called median will actually be the dist*100'th percentile |
320 medianWinSize = getPeakPickWindowSize(type, sampleRate, bin, dist); | 320 medianWinSize = getPeakPickWindowSize(type, sampleRate, bin, dist); |
321 halfWin = medianWinSize/2; | 321 halfWin = medianWinSize/2; |
322 | 322 |
323 while (window.size() > medianWinSize) { | 323 while ((int)window.size() > medianWinSize) { |
324 window.pop_front(); | 324 window.pop_front(); |
325 } | 325 } |
326 | 326 |
327 size_t actualSize = window.size(); | 327 int actualSize = window.size(); |
328 | 328 |
329 if (type == MajorPitchAdaptivePeaks) { | 329 if (type == MajorPitchAdaptivePeaks) { |
330 if (ymax + halfWin < values.size()) binmax = ymax + halfWin; | 330 if (ymax + halfWin < values.size()) binmax = ymax + halfWin; |
331 else binmax = values.size()-1; | 331 else binmax = values.size()-1; |
332 } | 332 } |
333 | 333 |
334 std::deque<float> sorted(window); | 334 std::deque<float> sorted(window); |
335 std::sort(sorted.begin(), sorted.end()); | 335 std::sort(sorted.begin(), sorted.end()); |
336 float median = sorted[int(sorted.size() * dist)]; | 336 float median = sorted[int(sorted.size() * dist)]; |
337 | 337 |
338 size_t centrebin = 0; | 338 int centrebin = 0; |
339 if (bin > actualSize/2) centrebin = bin - actualSize/2; | 339 if (bin > actualSize/2) centrebin = bin - actualSize/2; |
340 | 340 |
341 while (centrebin > prevcentre || bin == binmin) { | 341 while (centrebin > prevcentre || bin == binmin) { |
342 | 342 |
343 if (centrebin > prevcentre) ++prevcentre; | 343 if (centrebin > prevcentre) ++prevcentre; |
348 inrange.push_back(centrebin); | 348 inrange.push_back(centrebin); |
349 } | 349 } |
350 | 350 |
351 if (centre <= median || centrebin+1 == values.size()) { | 351 if (centre <= median || centrebin+1 == values.size()) { |
352 if (!inrange.empty()) { | 352 if (!inrange.empty()) { |
353 size_t peakbin = 0; | 353 int peakbin = 0; |
354 float peakval = 0.f; | 354 float peakval = 0.f; |
355 for (size_t i = 0; i < inrange.size(); ++i) { | 355 for (int i = 0; i < (int)inrange.size(); ++i) { |
356 if (i == 0 || values[inrange[i]] > peakval) { | 356 if (i == 0 || values[inrange[i]] > peakval) { |
357 peakval = values[inrange[i]]; | 357 peakval = values[inrange[i]]; |
358 peakbin = inrange[i]; | 358 peakbin = inrange[i]; |
359 } | 359 } |
360 } | 360 } |
370 } | 370 } |
371 | 371 |
372 return peaks; | 372 return peaks; |
373 } | 373 } |
374 | 374 |
375 size_t | 375 int |
376 FFTModel::getPeakPickWindowSize(PeakPickType type, size_t sampleRate, | 376 FFTModel::getPeakPickWindowSize(PeakPickType type, int sampleRate, |
377 size_t bin, float &percentile) const | 377 int bin, float &percentile) const |
378 { | 378 { |
379 percentile = 0.5; | 379 percentile = 0.5; |
380 if (type == MajorPeaks) return 10; | 380 if (type == MajorPeaks) return 10; |
381 if (bin == 0) return 3; | 381 if (bin == 0) return 3; |
382 | 382 |
383 size_t fftSize = m_server->getFFTSize() >> m_yshift; | 383 int fftSize = m_server->getFFTSize() >> m_yshift; |
384 float binfreq = (sampleRate * bin) / fftSize; | 384 float binfreq = (sampleRate * bin) / fftSize; |
385 float hifreq = Pitch::getFrequencyForPitch(73, 0, binfreq); | 385 float hifreq = Pitch::getFrequencyForPitch(73, 0, binfreq); |
386 | 386 |
387 int hibin = lrintf((hifreq * fftSize) / sampleRate); | 387 int hibin = lrintf((hifreq * fftSize) / sampleRate); |
388 int medianWinSize = hibin - bin; | 388 int medianWinSize = hibin - bin; |
392 | 392 |
393 return medianWinSize; | 393 return medianWinSize; |
394 } | 394 } |
395 | 395 |
396 FFTModel::PeakSet | 396 FFTModel::PeakSet |
397 FFTModel::getPeakFrequencies(PeakPickType type, size_t x, | 397 FFTModel::getPeakFrequencies(PeakPickType type, int x, |
398 size_t ymin, size_t ymax) | 398 int ymin, int ymax) |
399 { | 399 { |
400 Profiler profiler("FFTModel::getPeakFrequencies"); | 400 Profiler profiler("FFTModel::getPeakFrequencies"); |
401 | 401 |
402 PeakSet peaks; | 402 PeakSet peaks; |
403 if (!isOK()) return peaks; | 403 if (!isOK()) return peaks; |
404 PeakLocationSet locations = getPeaks(type, x, ymin, ymax); | 404 PeakLocationSet locations = getPeaks(type, x, ymin, ymax); |
405 | 405 |
406 size_t sampleRate = getSampleRate(); | 406 int sampleRate = getSampleRate(); |
407 size_t fftSize = m_server->getFFTSize() >> m_yshift; | 407 int fftSize = m_server->getFFTSize() >> m_yshift; |
408 size_t incr = getResolution(); | 408 int incr = getResolution(); |
409 | 409 |
410 // This duplicates some of the work of estimateStableFrequency to | 410 // This duplicates some of the work of estimateStableFrequency to |
411 // allow us to retrieve the phases in two separate vertical | 411 // allow us to retrieve the phases in two separate vertical |
412 // columns, instead of jumping back and forth between columns x and | 412 // columns, instead of jumping back and forth between columns x and |
413 // x+1, which may be significantly slower if re-seeking is needed | 413 // x+1, which may be significantly slower if re-seeking is needed |
416 for (PeakLocationSet::iterator i = locations.begin(); | 416 for (PeakLocationSet::iterator i = locations.begin(); |
417 i != locations.end(); ++i) { | 417 i != locations.end(); ++i) { |
418 phases.push_back(getPhaseAt(x, *i)); | 418 phases.push_back(getPhaseAt(x, *i)); |
419 } | 419 } |
420 | 420 |
421 size_t phaseIndex = 0; | 421 int phaseIndex = 0; |
422 for (PeakLocationSet::iterator i = locations.begin(); | 422 for (PeakLocationSet::iterator i = locations.begin(); |
423 i != locations.end(); ++i) { | 423 i != locations.end(); ++i) { |
424 float oldPhase = phases[phaseIndex]; | 424 float oldPhase = phases[phaseIndex]; |
425 float newPhase = getPhaseAt(x+1, *i); | 425 float newPhase = getPhaseAt(x+1, *i); |
426 float expectedPhase = oldPhase + (2.0 * M_PI * *i * incr) / fftSize; | 426 float expectedPhase = oldPhase + (2.0 * M_PI * *i * incr) / fftSize; |