Chris@0
|
1 /* -*- c-basic-offset: 4 -*- vi:set ts=8 sts=4 sw=4: */
|
Chris@0
|
2
|
Chris@0
|
3 /*
|
Chris@0
|
4 A waveform viewer and audio annotation editor.
|
Chris@5
|
5 Chris Cannam, Queen Mary University of London, 2005-2006
|
Chris@0
|
6
|
Chris@0
|
7 This is experimental software. Not for distribution.
|
Chris@0
|
8 */
|
Chris@0
|
9
|
Chris@30
|
10 #ifndef _SPECTROGRAM_LAYER_H_
|
Chris@30
|
11 #define _SPECTROGRAM_LAYER_H_
|
Chris@0
|
12
|
Chris@0
|
13 #include "base/Layer.h"
|
Chris@0
|
14 #include "base/Window.h"
|
Chris@0
|
15 #include "model/PowerOfSqrtTwoZoomConstraint.h"
|
Chris@0
|
16 #include "model/DenseTimeValueModel.h"
|
Chris@0
|
17
|
Chris@0
|
18 #include <QThread>
|
Chris@0
|
19 #include <QMutex>
|
Chris@0
|
20 #include <QWaitCondition>
|
Chris@0
|
21
|
Chris@0
|
22 #include <fftw3.h>
|
Chris@0
|
23
|
Chris@38
|
24 #include <stdint.h>
|
Chris@38
|
25
|
Chris@0
|
26 class View;
|
Chris@0
|
27 class QPainter;
|
Chris@0
|
28 class QImage;
|
Chris@0
|
29 class QPixmap;
|
Chris@0
|
30 class QTimer;
|
Chris@0
|
31 class RealTime;
|
Chris@0
|
32
|
Chris@0
|
33 /**
|
Chris@0
|
34 * SpectrogramLayer represents waveform data (obtained from a
|
Chris@0
|
35 * DenseTimeValueModel) in spectrogram form.
|
Chris@0
|
36 */
|
Chris@0
|
37
|
Chris@0
|
38 class SpectrogramLayer : public Layer,
|
Chris@31
|
39 public PowerOfSqrtTwoZoomConstraint
|
Chris@0
|
40 {
|
Chris@0
|
41 Q_OBJECT
|
Chris@0
|
42
|
Chris@0
|
43 public:
|
Chris@37
|
44 enum Configuration { FullRangeDb, MelodicRange, MelodicPeaks };
|
Chris@0
|
45
|
Chris@44
|
46 SpectrogramLayer(Configuration = FullRangeDb);
|
Chris@0
|
47 ~SpectrogramLayer();
|
Chris@0
|
48
|
Chris@0
|
49 virtual const ZoomConstraint *getZoomConstraint() const { return this; }
|
Chris@0
|
50 virtual const Model *getModel() const { return m_model; }
|
Chris@44
|
51 virtual void paint(View *v, QPainter &paint, QRect rect) const;
|
Chris@0
|
52
|
Chris@44
|
53 virtual int getVerticalScaleWidth(View *v, QPainter &) const;
|
Chris@44
|
54 virtual void paintVerticalScale(View *v, QPainter &paint, QRect rect) const;
|
Chris@0
|
55
|
Chris@44
|
56 virtual QString getFeatureDescription(View *v, QPoint &) const;
|
Chris@0
|
57
|
Chris@44
|
58 virtual bool snapToFeatureFrame(View *v, int &frame,
|
Chris@28
|
59 size_t &resolution,
|
Chris@28
|
60 SnapType snap) const;
|
Chris@13
|
61
|
Chris@0
|
62 void setModel(const DenseTimeValueModel *model);
|
Chris@0
|
63
|
Chris@0
|
64 virtual PropertyList getProperties() const;
|
Chris@0
|
65 virtual PropertyType getPropertyType(const PropertyName &) const;
|
Chris@0
|
66 virtual QString getPropertyGroupName(const PropertyName &) const;
|
Chris@0
|
67 virtual int getPropertyRangeAndValue(const PropertyName &,
|
Chris@0
|
68 int *min, int *max) const;
|
Chris@0
|
69 virtual QString getPropertyValueLabel(const PropertyName &,
|
Chris@0
|
70 int value) const;
|
Chris@0
|
71 virtual void setProperty(const PropertyName &, int value);
|
Chris@0
|
72
|
Chris@0
|
73 /**
|
Chris@0
|
74 * Specify the channel to use from the source model.
|
Chris@0
|
75 * A value of -1 means to mix all available channels.
|
Chris@0
|
76 * The default is channel 0.
|
Chris@0
|
77 */
|
Chris@0
|
78 void setChannel(int);
|
Chris@0
|
79 int getChannel() const;
|
Chris@0
|
80
|
Chris@0
|
81 void setWindowSize(size_t);
|
Chris@0
|
82 size_t getWindowSize() const;
|
Chris@0
|
83
|
Chris@0
|
84 void setWindowOverlap(size_t percent);
|
Chris@0
|
85 size_t getWindowOverlap() const;
|
Chris@0
|
86
|
Chris@0
|
87 void setWindowType(WindowType type);
|
Chris@0
|
88 WindowType getWindowType() const;
|
Chris@0
|
89
|
Chris@0
|
90 /**
|
Chris@0
|
91 * Set the gain multiplier for sample values in this view prior to
|
Chris@0
|
92 * FFT calculation.
|
Chris@0
|
93 *
|
Chris@0
|
94 * The default is 1.0.
|
Chris@0
|
95 */
|
Chris@0
|
96 void setGain(float gain);
|
Chris@0
|
97 float getGain() const;
|
Chris@0
|
98
|
Chris@37
|
99 /**
|
Chris@37
|
100 * Set the threshold for sample values to be shown in the FFT,
|
Chris@37
|
101 * in voltage units.
|
Chris@37
|
102 *
|
Chris@37
|
103 * The default is 0.0.
|
Chris@37
|
104 */
|
Chris@37
|
105 void setThreshold(float threshold);
|
Chris@37
|
106 float getThreshold() const;
|
Chris@37
|
107
|
Chris@37
|
108 void setMinFrequency(size_t);
|
Chris@37
|
109 size_t getMinFrequency() const;
|
Chris@37
|
110
|
Chris@0
|
111 void setMaxFrequency(size_t); // 0 -> no maximum
|
Chris@0
|
112 size_t getMaxFrequency() const;
|
Chris@0
|
113
|
Chris@37
|
114 enum ColourScale {
|
Chris@37
|
115 LinearColourScale,
|
Chris@37
|
116 MeterColourScale,
|
Chris@37
|
117 dBColourScale,
|
Chris@37
|
118 PhaseColourScale
|
Chris@37
|
119 };
|
Chris@0
|
120
|
Chris@0
|
121 /**
|
Chris@0
|
122 * Specify the scale for sample levels. See WaveformLayer for
|
Chris@0
|
123 * details of meter and dB scaling. The default is dBColourScale.
|
Chris@0
|
124 */
|
Chris@0
|
125 void setColourScale(ColourScale);
|
Chris@0
|
126 ColourScale getColourScale() const;
|
Chris@0
|
127
|
Chris@35
|
128 enum FrequencyScale {
|
Chris@35
|
129 LinearFrequencyScale,
|
Chris@35
|
130 LogFrequencyScale
|
Chris@35
|
131 };
|
Chris@0
|
132
|
Chris@0
|
133 /**
|
Chris@0
|
134 * Specify the scale for the y axis.
|
Chris@0
|
135 */
|
Chris@0
|
136 void setFrequencyScale(FrequencyScale);
|
Chris@0
|
137 FrequencyScale getFrequencyScale() const;
|
Chris@0
|
138
|
Chris@37
|
139 enum BinDisplay {
|
Chris@37
|
140 AllBins,
|
Chris@37
|
141 PeakBins,
|
Chris@37
|
142 PeakFrequencies
|
Chris@35
|
143 };
|
Chris@35
|
144
|
Chris@35
|
145 /**
|
Chris@35
|
146 * Specify the processing of frequency bins for the y axis.
|
Chris@35
|
147 */
|
Chris@37
|
148 void setBinDisplay(BinDisplay);
|
Chris@37
|
149 BinDisplay getBinDisplay() const;
|
Chris@35
|
150
|
Chris@36
|
151 void setNormalizeColumns(bool n);
|
Chris@36
|
152 bool getNormalizeColumns() const;
|
Chris@36
|
153
|
Chris@0
|
154 enum ColourScheme { DefaultColours, WhiteOnBlack, BlackOnWhite,
|
Chris@40
|
155 RedOnBlue, YellowOnBlack, Rainbow };
|
Chris@0
|
156
|
Chris@0
|
157 void setColourScheme(ColourScheme scheme);
|
Chris@0
|
158 ColourScheme getColourScheme() const;
|
Chris@0
|
159
|
Chris@9
|
160 /**
|
Chris@9
|
161 * Specify the colourmap rotation for the colour scale.
|
Chris@9
|
162 */
|
Chris@9
|
163 void setColourRotation(int);
|
Chris@9
|
164 int getColourRotation() const;
|
Chris@9
|
165
|
Chris@0
|
166 virtual VerticalPosition getPreferredFrameCountPosition() const {
|
Chris@0
|
167 return PositionTop;
|
Chris@0
|
168 }
|
Chris@0
|
169
|
Chris@15
|
170 virtual bool isLayerOpaque() const { return true; }
|
Chris@15
|
171
|
Chris@44
|
172 float getYForFrequency(View *v, float frequency) const;
|
Chris@44
|
173 float getFrequencyForY(View *v, int y) const;
|
Chris@42
|
174
|
Chris@0
|
175 virtual int getCompletion() const;
|
Chris@0
|
176
|
Chris@6
|
177 virtual QString toXmlString(QString indent = "",
|
Chris@6
|
178 QString extraAttributes = "") const;
|
Chris@6
|
179
|
Chris@11
|
180 void setProperties(const QXmlAttributes &attributes);
|
Chris@11
|
181
|
Chris@44
|
182 virtual void setLayerDormant(const bool dormant);
|
Chris@29
|
183
|
Chris@0
|
184 protected slots:
|
Chris@0
|
185 void cacheInvalid();
|
Chris@0
|
186 void cacheInvalid(size_t startFrame, size_t endFrame);
|
Chris@0
|
187
|
Chris@0
|
188 void fillTimerTimedOut();
|
Chris@0
|
189
|
Chris@0
|
190 protected:
|
Chris@0
|
191 const DenseTimeValueModel *m_model; // I do not own this
|
Chris@0
|
192
|
Chris@35
|
193 int m_channel;
|
Chris@35
|
194 size_t m_windowSize;
|
Chris@35
|
195 WindowType m_windowType;
|
Chris@35
|
196 size_t m_windowOverlap;
|
Chris@35
|
197 float m_gain;
|
Chris@37
|
198 float m_threshold;
|
Chris@35
|
199 int m_colourRotation;
|
Chris@37
|
200 size_t m_minFrequency;
|
Chris@35
|
201 size_t m_maxFrequency;
|
Chris@35
|
202 ColourScale m_colourScale;
|
Chris@35
|
203 ColourScheme m_colourScheme;
|
Chris@35
|
204 FrequencyScale m_frequencyScale;
|
Chris@37
|
205 BinDisplay m_binDisplay;
|
Chris@36
|
206 bool m_normalizeColumns;
|
Chris@0
|
207
|
Chris@38
|
208 // At the moment we cache one unsigned char per bin for the
|
Chris@38
|
209 // magnitude -- which is nothing like precise enough to allow us
|
Chris@38
|
210 // to subsequently adjust gain etc without recalculating the
|
Chris@38
|
211 // cached values -- plus optionally one unsigned char per bin for
|
Chris@38
|
212 // phase-adjusted frequency.
|
Chris@37
|
213
|
Chris@38
|
214 // To speed up redrawing after parameter changes, we would like to
|
Chris@38
|
215 // cache magnitude in a way that can have gain applied afterwards
|
Chris@38
|
216 // and can determine whether something is a peak or not, and also
|
Chris@38
|
217 // cache phase rather than only phase-adjusted frequency so that
|
Chris@38
|
218 // we don't have to recalculate if switching between phase and
|
Chris@38
|
219 // magnitude displays.
|
Chris@38
|
220
|
Chris@38
|
221 // This implies probably 16 bits for a normalized magnitude (in
|
Chris@38
|
222 // dB?) and at most 16 bits for phase. 16 or 32 bits per bin
|
Chris@38
|
223 // instead of 8 or 16.
|
Chris@38
|
224
|
Chris@38
|
225 // Each column's magnitudes are expected to be stored normalized
|
Chris@38
|
226 // to [0,1] with respect to the column, so the normalization
|
Chris@38
|
227 // factor should be calculated before all values in a column, and
|
Chris@38
|
228 // set appropriately.
|
Chris@38
|
229
|
Chris@31
|
230 class Cache {
|
Chris@31
|
231 public:
|
Chris@38
|
232 Cache(); // of size zero, call resize() before using
|
Chris@31
|
233 ~Cache();
|
Chris@31
|
234
|
Chris@38
|
235 size_t getWidth() const { return m_width; }
|
Chris@38
|
236 size_t getHeight() const { return m_height; }
|
Chris@38
|
237
|
Chris@38
|
238 void resize(size_t width, size_t height);
|
Chris@38
|
239 void reset(); // zero-fill or 1-fill as appropriate without changing size
|
Chris@38
|
240
|
Chris@38
|
241 float getMagnitudeAt(size_t x, size_t y) const {
|
Chris@38
|
242 return getNormalizedMagnitudeAt(x, y) * m_factor[x];
|
Chris@38
|
243 }
|
Chris@35
|
244
|
Chris@38
|
245 float getNormalizedMagnitudeAt(size_t x, size_t y) const {
|
Chris@44
|
246 return float(m_magnitude[x][y]) / 65535.0;
|
Chris@38
|
247 }
|
Chris@31
|
248
|
Chris@38
|
249 float getPhaseAt(size_t x, size_t y) const {
|
Chris@44
|
250 int16_t i = (int16_t)m_phase[x][y];
|
Chris@39
|
251 return (float(i) / 32767.0) * M_PI;
|
Chris@38
|
252 }
|
Chris@31
|
253
|
Chris@38
|
254 bool isLocalPeak(size_t x, size_t y) const {
|
Chris@44
|
255 if (y > 0 && m_magnitude[x][y] < m_magnitude[x][y-1]) return false;
|
Chris@44
|
256 if (y < m_height-1 && m_magnitude[x][y] < m_magnitude[x][y+1]) return false;
|
Chris@38
|
257 return true;
|
Chris@38
|
258 }
|
Chris@31
|
259
|
Chris@38
|
260 bool isOverThreshold(size_t x, size_t y, float threshold) const {
|
Chris@38
|
261 if (threshold == 0.0) return true;
|
Chris@38
|
262 return getMagnitudeAt(x, y) > threshold;
|
Chris@38
|
263 }
|
Chris@38
|
264
|
Chris@38
|
265 void setNormalizationFactor(size_t x, float factor) {
|
Chris@41
|
266 if (x < m_width) m_factor[x] = factor;
|
Chris@38
|
267 }
|
Chris@38
|
268
|
Chris@38
|
269 void setMagnitudeAt(size_t x, size_t y, float mag) {
|
Chris@38
|
270 // norm factor must already be set
|
Chris@38
|
271 setNormalizedMagnitudeAt(x, y, mag / m_factor[x]);
|
Chris@38
|
272 }
|
Chris@38
|
273
|
Chris@38
|
274 void setNormalizedMagnitudeAt(size_t x, size_t y, float norm) {
|
Chris@41
|
275 if (x < m_width && y < m_height) {
|
Chris@44
|
276 m_magnitude[x][y] = uint16_t(norm * 65535.0);
|
Chris@41
|
277 }
|
Chris@38
|
278 }
|
Chris@38
|
279
|
Chris@38
|
280 void setPhaseAt(size_t x, size_t y, float phase) {
|
Chris@38
|
281 // phase in range -pi -> pi
|
Chris@41
|
282 if (x < m_width && y < m_height) {
|
Chris@44
|
283 m_phase[x][y] = uint16_t(int16_t((phase * 32767) / M_PI));
|
Chris@41
|
284 }
|
Chris@38
|
285 }
|
Chris@38
|
286
|
Chris@38
|
287 QColor getColour(unsigned char index) const {
|
Chris@38
|
288 return m_colours[index];
|
Chris@38
|
289 }
|
Chris@38
|
290
|
Chris@38
|
291 void setColour(unsigned char index, QColor colour) {
|
Chris@38
|
292 m_colours[index] = colour;
|
Chris@38
|
293 }
|
Chris@38
|
294
|
Chris@38
|
295 private:
|
Chris@31
|
296 size_t m_width;
|
Chris@31
|
297 size_t m_height;
|
Chris@38
|
298 uint16_t **m_magnitude;
|
Chris@38
|
299 uint16_t **m_phase;
|
Chris@38
|
300 float *m_factor;
|
Chris@31
|
301 QColor m_colours[256];
|
Chris@38
|
302
|
Chris@38
|
303 void resize(uint16_t **&, size_t, size_t);
|
Chris@31
|
304 };
|
Chris@38
|
305
|
Chris@38
|
306 enum { NO_VALUE = 0 }; // colour index for unused pixels
|
Chris@38
|
307
|
Chris@31
|
308 Cache *m_cache;
|
Chris@31
|
309 bool m_cacheInvalid;
|
Chris@31
|
310
|
Chris@0
|
311 class CacheFillThread : public QThread
|
Chris@0
|
312 {
|
Chris@0
|
313 public:
|
Chris@0
|
314 CacheFillThread(SpectrogramLayer &layer) :
|
Chris@0
|
315 m_layer(layer), m_fillExtent(0) { }
|
Chris@0
|
316
|
Chris@0
|
317 size_t getFillExtent() const { return m_fillExtent; }
|
Chris@0
|
318 size_t getFillCompletion() const { return m_fillCompletion; }
|
Chris@0
|
319 virtual void run();
|
Chris@0
|
320
|
Chris@0
|
321 protected:
|
Chris@0
|
322 SpectrogramLayer &m_layer;
|
Chris@0
|
323 size_t m_fillExtent;
|
Chris@0
|
324 size_t m_fillCompletion;
|
Chris@0
|
325 };
|
Chris@0
|
326
|
Chris@0
|
327 void fillCache();
|
Chris@0
|
328
|
Chris@0
|
329 mutable QPixmap *m_pixmapCache;
|
Chris@0
|
330 mutable bool m_pixmapCacheInvalid;
|
Chris@0
|
331 mutable long m_pixmapCacheStartFrame;
|
Chris@0
|
332 mutable size_t m_pixmapCacheZoomLevel;
|
Chris@0
|
333
|
Chris@0
|
334 QWaitCondition m_condition;
|
Chris@0
|
335 mutable QMutex m_mutex;
|
Chris@0
|
336
|
Chris@0
|
337 CacheFillThread *m_fillThread;
|
Chris@0
|
338 QTimer *m_updateTimer;
|
Chris@44
|
339 mutable size_t m_candidateFillStartFrame;
|
Chris@0
|
340 size_t m_lastFillExtent;
|
Chris@0
|
341 bool m_exiting;
|
Chris@0
|
342
|
Chris@0
|
343 void setCacheColourmap();
|
Chris@9
|
344 void rotateCacheColourmap(int distance);
|
Chris@0
|
345
|
Chris@38
|
346 void fillCacheColumn(int column,
|
Chris@0
|
347 double *inputBuffer,
|
Chris@0
|
348 fftw_complex *outputBuffer,
|
Chris@0
|
349 fftw_plan plan,
|
Chris@9
|
350 size_t windowSize,
|
Chris@9
|
351 size_t windowIncrement,
|
Chris@38
|
352 const Window<double> &windower)
|
Chris@0
|
353 const;
|
Chris@0
|
354
|
Chris@38
|
355 static float calculateFrequency(size_t bin,
|
Chris@38
|
356 size_t windowSize,
|
Chris@38
|
357 size_t windowIncrement,
|
Chris@38
|
358 size_t sampleRate,
|
Chris@38
|
359 float previousPhase,
|
Chris@38
|
360 float currentPhase,
|
Chris@38
|
361 bool &steadyState);
|
Chris@38
|
362
|
Chris@38
|
363 unsigned char getDisplayValue(float input) const;
|
Chris@40
|
364 float getInputForDisplayValue(unsigned char uc) const;
|
Chris@40
|
365
|
Chris@40
|
366 int getColourScaleWidth(QPainter &) const;
|
Chris@40
|
367
|
Chris@40
|
368 float getEffectiveMinFrequency() const;
|
Chris@40
|
369 float getEffectiveMaxFrequency() const;
|
Chris@38
|
370
|
Chris@0
|
371 struct LayerRange {
|
Chris@0
|
372 long startFrame;
|
Chris@0
|
373 int zoomLevel;
|
Chris@0
|
374 size_t modelStart;
|
Chris@0
|
375 size_t modelEnd;
|
Chris@0
|
376 };
|
Chris@44
|
377 bool getXBinRange(View *v, int x, float &windowMin, float &windowMax) const;
|
Chris@44
|
378 bool getYBinRange(View *v, int y, float &freqBinMin, float &freqBinMax) const;
|
Chris@0
|
379
|
Chris@44
|
380 bool getYBinSourceRange(View *v, int y, float &freqMin, float &freqMax) const;
|
Chris@44
|
381 bool getAdjustedYBinSourceRange(View *v, int x, int y,
|
Chris@35
|
382 float &freqMin, float &freqMax,
|
Chris@35
|
383 float &adjFreqMin, float &adjFreqMax) const;
|
Chris@44
|
384 bool getXBinSourceRange(View *v, int x, RealTime &timeMin, RealTime &timeMax) const;
|
Chris@44
|
385 bool getXYBinSourceRange(View *v, int x, int y, float &min, float &max,
|
Chris@38
|
386 float &phaseMin, float &phaseMax) const;
|
Chris@0
|
387
|
Chris@0
|
388 size_t getWindowIncrement() const {
|
Chris@0
|
389 return m_windowSize - m_windowSize * m_windowOverlap / 100;
|
Chris@0
|
390 }
|
Chris@0
|
391 };
|
Chris@0
|
392
|
Chris@0
|
393 #endif
|