cannam@0
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
cannam@0
|
2
|
cannam@0
|
3 /*
|
cannam@0
|
4 Vamp
|
cannam@0
|
5
|
cannam@0
|
6 An API for audio analysis and feature extraction plugins.
|
cannam@0
|
7
|
cannam@0
|
8 Centre for Digital Music, Queen Mary, University of London.
|
cannam@0
|
9 Copyright 2006 Chris Cannam.
|
cannam@0
|
10
|
cannam@0
|
11 Permission is hereby granted, free of charge, to any person
|
cannam@0
|
12 obtaining a copy of this software and associated documentation
|
cannam@0
|
13 files (the "Software"), to deal in the Software without
|
cannam@0
|
14 restriction, including without limitation the rights to use, copy,
|
cannam@0
|
15 modify, merge, publish, distribute, sublicense, and/or sell copies
|
cannam@0
|
16 of the Software, and to permit persons to whom the Software is
|
cannam@0
|
17 furnished to do so, subject to the following conditions:
|
cannam@0
|
18
|
cannam@0
|
19 The above copyright notice and this permission notice shall be
|
cannam@0
|
20 included in all copies or substantial portions of the Software.
|
cannam@0
|
21
|
cannam@0
|
22 THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
|
cannam@0
|
23 EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF
|
cannam@0
|
24 MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
|
cannam@0
|
25 NONINFRINGEMENT. IN NO EVENT SHALL THE X CONSORTIUM BE LIABLE FOR
|
cannam@0
|
26 ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF
|
cannam@0
|
27 CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION
|
cannam@0
|
28 WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
cannam@0
|
29
|
cannam@0
|
30 Except as contained in this notice, the names of the Centre for
|
cannam@0
|
31 Digital Music; Queen Mary, University of London; and Chris Cannam
|
cannam@0
|
32 shall not be used in advertising or otherwise to promote the sale,
|
cannam@0
|
33 use or other dealings in this Software without prior written
|
cannam@0
|
34 authorization.
|
cannam@0
|
35 */
|
cannam@0
|
36
|
cannam@0
|
#include "SpectralCentroid.h"

#include <cmath>
|
cannam@0
|
38
|
cannam@0
|
39 /*
|
cannam@0
|
40 #include "dsp/transforms/FFT.h"
|
cannam@0
|
41 #include "base/Window.h"
|
cannam@0
|
42 */
|
cannam@0
|
43
|
cannam@0
|
44 using std::string;
|
cannam@0
|
45 using std::vector;
|
cannam@0
|
46 using std::cerr;
|
cannam@0
|
47 using std::endl;
|
cannam@0
|
48
|
cannam@0
|
49
|
cannam@0
|
50 SpectralCentroid::SpectralCentroid(float inputSampleRate) :
|
cannam@0
|
51 Plugin(inputSampleRate),
|
cannam@0
|
52 m_stepSize(0),
|
cannam@0
|
53 m_blockSize(0),
|
cannam@0
|
54 m_workBuffer(0)
|
cannam@0
|
55 {
|
cannam@0
|
56 }
|
cannam@0
|
57
|
cannam@0
|
58 SpectralCentroid::~SpectralCentroid()
|
cannam@0
|
59 {
|
cannam@0
|
60 delete m_workBuffer;
|
cannam@0
|
61 }
|
cannam@0
|
62
|
cannam@0
|
63 string
|
cannam@0
|
64 SpectralCentroid::getName() const
|
cannam@0
|
65 {
|
cannam@0
|
66 return "spectralcentroid";
|
cannam@0
|
67 }
|
cannam@0
|
68
|
cannam@0
|
69 string
|
cannam@0
|
70 SpectralCentroid::getDescription() const
|
cannam@0
|
71 {
|
cannam@0
|
72 return "Spectral Centroid";
|
cannam@0
|
73 }
|
cannam@0
|
74
|
cannam@0
|
75 string
|
cannam@0
|
76 SpectralCentroid::getMaker() const
|
cannam@0
|
77 {
|
cannam@0
|
78 return "QMUL";
|
cannam@0
|
79 }
|
cannam@0
|
80
|
cannam@0
|
81 int
|
cannam@0
|
82 SpectralCentroid::getPluginVersion() const
|
cannam@0
|
83 {
|
cannam@0
|
84 return 2;
|
cannam@0
|
85 }
|
cannam@0
|
86
|
cannam@0
|
87 string
|
cannam@0
|
88 SpectralCentroid::getCopyright() const
|
cannam@0
|
89 {
|
cannam@0
|
90 return "GPL";
|
cannam@0
|
91 }
|
cannam@0
|
92
|
cannam@0
|
93 bool
|
cannam@0
|
94 SpectralCentroid::initialise(size_t channels, size_t stepSize, size_t blockSize)
|
cannam@0
|
95 {
|
cannam@0
|
96 if (channels < getMinChannelCount() ||
|
cannam@0
|
97 channels > getMaxChannelCount()) return false;
|
cannam@0
|
98
|
cannam@0
|
99 m_stepSize = stepSize;
|
cannam@0
|
100 m_blockSize = blockSize;
|
cannam@0
|
101
|
cannam@0
|
102 delete m_workBuffer;
|
cannam@0
|
103 m_workBuffer = new double[m_blockSize * 4];
|
cannam@0
|
104
|
cannam@0
|
105 return true;
|
cannam@0
|
106 }
|
cannam@0
|
107
|
cannam@0
|
108 void
|
cannam@0
|
109 SpectralCentroid::reset()
|
cannam@0
|
110 {
|
cannam@0
|
111 delete m_workBuffer;
|
cannam@0
|
112 m_workBuffer = new double[m_blockSize * 4];
|
cannam@0
|
113 }
|
cannam@0
|
114
|
cannam@0
|
115 size_t
|
cannam@0
|
116 SpectralCentroid::getPreferredStepSize() const
|
cannam@0
|
117 {
|
cannam@0
|
118 return 2048; // or whatever -- parameter?
|
cannam@0
|
119 }
|
cannam@0
|
120
|
cannam@0
|
121 size_t
|
cannam@0
|
122 SpectralCentroid::getPreferredBlockSize() const
|
cannam@0
|
123 {
|
cannam@0
|
124 return getPreferredStepSize();
|
cannam@0
|
125 }
|
cannam@0
|
126
|
cannam@0
|
127 SpectralCentroid::OutputList
|
cannam@0
|
128 SpectralCentroid::getOutputDescriptors() const
|
cannam@0
|
129 {
|
cannam@0
|
130 OutputList list;
|
cannam@0
|
131
|
cannam@0
|
132 OutputDescriptor d;
|
cannam@0
|
133 d.name = "logcentroid";
|
cannam@0
|
134 d.unit = "Hz";
|
cannam@0
|
135 d.description = "Log Frequency Centroid";
|
cannam@0
|
136 d.hasFixedValueCount = true;
|
cannam@0
|
137 d.valueCount = 1;
|
cannam@0
|
138 d.hasKnownExtents = false;
|
cannam@0
|
139 d.isQuantized = false;
|
cannam@0
|
140 d.sampleType = OutputDescriptor::OneSamplePerStep;
|
cannam@0
|
141 list.push_back(d);
|
cannam@0
|
142
|
cannam@0
|
143 d.name = "linearcentroid";
|
cannam@0
|
144 d.description = "Linear Frequency Centroid";
|
cannam@0
|
145 list.push_back(d);
|
cannam@0
|
146
|
cannam@0
|
147 return list;
|
cannam@0
|
148 }
|
cannam@0
|
149
|
cannam@0
|
150 SpectralCentroid::FeatureSet
|
cannam@0
|
151 SpectralCentroid::process(float **inputBuffers, Vamp::RealTime)
|
cannam@0
|
152 {
|
cannam@0
|
153 if (m_stepSize == 0) {
|
cannam@0
|
154 cerr << "ERROR: SpectralCentroid::process: "
|
cannam@0
|
155 << "SpectralCentroid has not been initialised"
|
cannam@0
|
156 << endl;
|
cannam@0
|
157 return FeatureSet();
|
cannam@0
|
158 }
|
cannam@0
|
159
|
cannam@0
|
160 /*
|
cannam@0
|
161 for (size_t i = 0; i < m_blockSize; ++i) {
|
cannam@0
|
162 m_workBuffer[i] = inputBuffers[0][i];
|
cannam@0
|
163 m_workBuffer[i + m_blockSize] = 0.0;
|
cannam@0
|
164 }
|
cannam@0
|
165
|
cannam@0
|
166 Window<double>(HanningWindow, m_blockSize).cut(m_workBuffer);
|
cannam@0
|
167
|
cannam@0
|
168 FFT::process(m_blockSize, false,
|
cannam@0
|
169 m_workBuffer,
|
cannam@0
|
170 m_workBuffer + m_blockSize,
|
cannam@0
|
171 m_workBuffer + m_blockSize*2,
|
cannam@0
|
172 m_workBuffer + m_blockSize*3);
|
cannam@0
|
173 */
|
cannam@0
|
174
|
cannam@0
|
175 double numLin = 0.0, numLog = 0.0, denom = 0.0;
|
cannam@0
|
176
|
cannam@0
|
177 for (size_t i = 1; i < m_blockSize/2; ++i) {
|
cannam@0
|
178 double freq = (double(i) * m_inputSampleRate) / m_blockSize;
|
cannam@0
|
179 double real = inputBuffers[0][i*2];
|
cannam@0
|
180 double imag = inputBuffers[0][i*2 + 1];
|
cannam@0
|
181 double power = sqrt(real * real + imag * imag) / (m_blockSize/2);
|
cannam@0
|
182 numLin += freq * power;
|
cannam@0
|
183 numLog += log10f(freq) * power;
|
cannam@0
|
184 denom += power;
|
cannam@0
|
185 }
|
cannam@0
|
186
|
cannam@0
|
187 FeatureSet returnFeatures;
|
cannam@0
|
188
|
cannam@0
|
189 std::cerr << "power " << denom << ", block size " << m_blockSize << std::endl;
|
cannam@0
|
190
|
cannam@0
|
191 if (denom != 0.0) {
|
cannam@0
|
192 float centroidLin = float(numLin / denom);
|
cannam@0
|
193 float centroidLog = exp10f(float(numLog / denom));
|
cannam@0
|
194 Feature feature;
|
cannam@0
|
195 feature.hasTimestamp = false;
|
cannam@0
|
196 feature.values.push_back(centroidLog);
|
cannam@0
|
197 returnFeatures[0].push_back(feature);
|
cannam@0
|
198 feature.values.clear();
|
cannam@0
|
199 feature.values.push_back(centroidLin);
|
cannam@0
|
200 returnFeatures[1].push_back(feature);
|
cannam@0
|
201 }
|
cannam@0
|
202
|
cannam@0
|
203 return returnFeatures;
|
cannam@0
|
204 }
|
cannam@0
|
205
|
cannam@0
|
206 SpectralCentroid::FeatureSet
|
cannam@0
|
207 SpectralCentroid::getRemainingFeatures()
|
cannam@0
|
208 {
|
cannam@0
|
209 return FeatureSet();
|
cannam@0
|
210 }
|
cannam@0
|
211
|