annotate NNLSChroma.cpp @ 119:c4d1208e5ea9 monophonicness

tidying up a bit
author Matthias Mauch <mail@matthiasmauch.net>
date Thu, 31 Mar 2011 14:59:11 +0100
parents 5f3d3ea6aab6
children 7a8956e903e1
rev   line source
Chris@23 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
matthiasm@0 2
Chris@35 3 /*
Chris@35 4 NNLS-Chroma / Chordino
Chris@35 5
Chris@35 6 Audio feature extraction plugins for chromagram and chord
Chris@35 7 estimation.
Chris@35 8
Chris@35 9 Centre for Digital Music, Queen Mary University of London.
Chris@35 10 This file copyright 2008-2010 Matthias Mauch and QMUL.
Chris@35 11
Chris@35 12 This program is free software; you can redistribute it and/or
Chris@35 13 modify it under the terms of the GNU General Public License as
Chris@35 14 published by the Free Software Foundation; either version 2 of the
Chris@35 15 License, or (at your option) any later version. See the file
Chris@35 16 COPYING included with this distribution for more information.
Chris@35 17 */
Chris@35 18
matthiasm@0 19 #include "NNLSChroma.h"
Chris@27 20
Chris@27 21 #include "chromamethods.h"
Chris@27 22
Chris@27 23 #include <cstdlib>
Chris@27 24 #include <fstream>
matthiasm@0 25 #include <cmath>
matthiasm@9 26
Chris@27 27 #include <algorithm>
matthiasm@0 28
// Compile-time switch for the "--> <method>" trace lines that the methods in
// this file write to cerr; while it is false none of those traces are emitted.
matthiasm@0 29 const bool debug_on = false;
matthiasm@0 30
matthiasm@0 31 NNLSChroma::NNLSChroma(float inputSampleRate) :
Chris@35 32 NNLSBase(inputSampleRate)
matthiasm@0 33 {
Chris@23 34 if (debug_on) cerr << "--> NNLSChroma" << endl;
matthiasm@0 35 }
matthiasm@0 36
matthiasm@0 37 NNLSChroma::~NNLSChroma()
matthiasm@0 38 {
Chris@23 39 if (debug_on) cerr << "--> ~NNLSChroma" << endl;
matthiasm@0 40 }
matthiasm@0 41
matthiasm@0 42 string
matthiasm@0 43 NNLSChroma::getIdentifier() const
matthiasm@0 44 {
Chris@23 45 if (debug_on) cerr << "--> getIdentifier" << endl;
matthiasm@46 46 return "nnls-chroma";
matthiasm@0 47 }
matthiasm@0 48
matthiasm@0 49 string
matthiasm@0 50 NNLSChroma::getName() const
matthiasm@0 51 {
Chris@23 52 if (debug_on) cerr << "--> getName" << endl;
matthiasm@0 53 return "NNLS Chroma";
matthiasm@0 54 }
matthiasm@0 55
matthiasm@0 56 string
matthiasm@0 57 NNLSChroma::getDescription() const
matthiasm@0 58 {
Chris@23 59 if (debug_on) cerr << "--> getDescription" << endl;
matthiasm@58 60 return "This plugin provides a number of features derived from a DFT-based log-frequency amplitude spectrum: some variants of the log-frequency spectrum, including a semitone spectrum derived from approximate transcription using the NNLS algorithm; and based on this semitone spectrum, different chroma features.";
matthiasm@0 61 }
matthiasm@0 62
matthiasm@0 63 NNLSChroma::OutputList
matthiasm@0 64 NNLSChroma::getOutputDescriptors() const
matthiasm@0 65 {
Chris@23 66 if (debug_on) cerr << "--> getOutputDescriptors" << endl;
matthiasm@0 67 OutputList list;
matthiasm@0 68
matthiasm@0 69 // Make chroma names for the binNames property
matthiasm@0 70 vector<string> chromanames;
matthiasm@0 71 vector<string> bothchromanames;
matthiasm@0 72 for (int iNote = 0; iNote < 24; iNote++) {
matthiasm@0 73 bothchromanames.push_back(notenames[iNote]);
matthiasm@0 74 if (iNote < 12) {
matthiasm@43 75 chromanames.push_back(notenames[iNote+12]);
matthiasm@0 76 }
matthiasm@0 77 }
matthiasm@0 78
Chris@35 79 int index = 0;
matthiasm@0 80
mail@117 81 OutputDescriptor logfreqspecOutput;
mail@117 82 logfreqspecOutput.identifier = "logfreqspec";
mail@117 83 logfreqspecOutput.name = "Log-Frequency Spectrum";
mail@117 84 logfreqspecOutput.description = "A Log-Frequency Spectrum (constant Q) that is obtained by cosine filter mapping.";
mail@117 85 logfreqspecOutput.unit = "";
mail@117 86 logfreqspecOutput.hasFixedBinCount = true;
mail@117 87 logfreqspecOutput.binCount = nNote;
mail@117 88 logfreqspecOutput.hasKnownExtents = false;
mail@117 89 logfreqspecOutput.isQuantized = false;
mail@117 90 logfreqspecOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@117 91 logfreqspecOutput.hasDuration = false;
mail@117 92 logfreqspecOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@117 93 list.push_back(logfreqspecOutput);
mail@117 94 m_outputLogfreqspec = index++;
matthiasm@0 95
mail@117 96 OutputDescriptor tunedlogfreqspecOutput;
mail@117 97 tunedlogfreqspecOutput.identifier = "tunedlogfreqspec";
mail@117 98 tunedlogfreqspecOutput.name = "Tuned Log-Frequency Spectrum";
mail@117 99 tunedlogfreqspecOutput.description = "A Log-Frequency Spectrum (constant Q) that is obtained by cosine filter mapping, then its tuned using the estimated tuning frequency.";
mail@117 100 tunedlogfreqspecOutput.unit = "";
mail@117 101 tunedlogfreqspecOutput.hasFixedBinCount = true;
mail@117 102 tunedlogfreqspecOutput.binCount = nNote;
mail@117 103 tunedlogfreqspecOutput.hasKnownExtents = false;
mail@117 104 tunedlogfreqspecOutput.isQuantized = false;
mail@117 105 tunedlogfreqspecOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@117 106 tunedlogfreqspecOutput.hasDuration = false;
mail@117 107 tunedlogfreqspecOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@117 108 list.push_back(tunedlogfreqspecOutput);
mail@117 109 m_outputTunedlogfreqspec = index++;
matthiasm@0 110
mail@117 111 OutputDescriptor semitonespectrumOutput;
mail@117 112 semitonespectrumOutput.identifier = "semitonespectrum";
mail@117 113 semitonespectrumOutput.name = "Semitone Spectrum";
mail@117 114 semitonespectrumOutput.description = "A semitone-spaced log-frequency spectrum derived from the third-of-a-semitone-spaced tuned log-frequency spectrum.";
mail@117 115 semitonespectrumOutput.unit = "";
mail@117 116 semitonespectrumOutput.hasFixedBinCount = true;
mail@117 117 semitonespectrumOutput.binCount = 84;
mail@117 118 semitonespectrumOutput.hasKnownExtents = false;
mail@117 119 semitonespectrumOutput.isQuantized = false;
mail@117 120 semitonespectrumOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@117 121 semitonespectrumOutput.hasDuration = false;
mail@117 122 semitonespectrumOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@117 123 list.push_back(semitonespectrumOutput);
mail@117 124 m_outputSemitonespectrum = index++;
matthiasm@0 125
mail@117 126 OutputDescriptor chromaOutput;
mail@117 127 chromaOutput.identifier = "chroma";
mail@117 128 chromaOutput.name = "Chromagram";
mail@117 129 chromaOutput.description = "Tuning-adjusted chromagram from NNLS approximate transcription, with an emphasis on the medium note range.";
mail@117 130 chromaOutput.unit = "";
mail@117 131 chromaOutput.hasFixedBinCount = true;
mail@117 132 chromaOutput.binCount = 12;
mail@117 133 chromaOutput.binNames = chromanames;
mail@117 134 chromaOutput.hasKnownExtents = false;
mail@117 135 chromaOutput.isQuantized = false;
mail@117 136 chromaOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@117 137 chromaOutput.hasDuration = false;
mail@117 138 chromaOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@117 139 list.push_back(chromaOutput);
Chris@35 140 m_outputChroma = index++;
matthiasm@0 141
mail@116 142 OutputDescriptor basschromaOutput;
mail@116 143 basschromaOutput.identifier = "basschroma";
mail@116 144 basschromaOutput.name = "Bass Chromagram";
mail@116 145 basschromaOutput.description = "Tuning-adjusted bass chromagram from NNLS approximate transcription, with an emphasis on the bass note range.";
mail@116 146 basschromaOutput.unit = "";
mail@116 147 basschromaOutput.hasFixedBinCount = true;
mail@116 148 basschromaOutput.binCount = 12;
mail@116 149 basschromaOutput.binNames = chromanames;
mail@116 150 basschromaOutput.hasKnownExtents = false;
mail@116 151 basschromaOutput.isQuantized = false;
mail@116 152 basschromaOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@116 153 basschromaOutput.hasDuration = false;
mail@116 154 basschromaOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@116 155 list.push_back(basschromaOutput);
mail@117 156 m_outputBasschroma = index++;
matthiasm@0 157
mail@116 158 OutputDescriptor bothchromaOutput;
mail@116 159 bothchromaOutput.identifier = "bothchroma";
mail@116 160 bothchromaOutput.name = "Chromagram and Bass Chromagram";
mail@116 161 bothchromaOutput.description = "Tuning-adjusted chromagram and bass chromagram (stacked on top of each other) from NNLS approximate transcription.";
mail@116 162 bothchromaOutput.unit = "";
mail@116 163 bothchromaOutput.hasFixedBinCount = true;
mail@116 164 bothchromaOutput.binCount = 24;
mail@116 165 bothchromaOutput.binNames = bothchromanames;
mail@116 166 bothchromaOutput.hasKnownExtents = false;
mail@116 167 bothchromaOutput.isQuantized = false;
mail@116 168 bothchromaOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@116 169 bothchromaOutput.hasDuration = false;
mail@116 170 bothchromaOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@116 171 list.push_back(bothchromaOutput);
mail@117 172 m_outputBothchroma = index++;
matthiasm@1 173
mail@116 174 OutputDescriptor consonanceOutput;
mail@116 175 consonanceOutput.identifier = "consonance";
mail@116 176 consonanceOutput.name = "Consonance estimate.";
mail@116 177 consonanceOutput.description = "A simple consonance value based on the convolution of a consonance profile with the semitone spectrum.";
mail@116 178 consonanceOutput.unit = "";
mail@116 179 consonanceOutput.hasFixedBinCount = true;
mail@116 180 consonanceOutput.binCount = 1;
mail@116 181 consonanceOutput.hasKnownExtents = false;
mail@116 182 consonanceOutput.isQuantized = false;
mail@116 183 consonanceOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@116 184 consonanceOutput.hasDuration = false;
mail@116 185 consonanceOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@116 186 list.push_back(consonanceOutput);
mail@83 187 m_outputConsonance = index++;
mail@83 188
mail@116 189 OutputDescriptor monophonicnessOutput;
mail@116 190 monophonicnessOutput.identifier = "monophonicness";
mail@116 191 monophonicnessOutput.name = "Monophonicness estimate.";
mail@116 192 monophonicnessOutput.description = ".";
mail@116 193 monophonicnessOutput.unit = "";
mail@116 194 monophonicnessOutput.hasFixedBinCount = true;
mail@116 195 monophonicnessOutput.binCount = 1;
mail@116 196 monophonicnessOutput.hasKnownExtents = true;
mail@116 197 monophonicnessOutput.minValue = 0;
mail@116 198 monophonicnessOutput.maxValue = 1;
mail@116 199 monophonicnessOutput.isQuantized = false;
mail@116 200 monophonicnessOutput.sampleType = OutputDescriptor::FixedSampleRate;
mail@116 201 monophonicnessOutput.hasDuration = false;
mail@116 202 monophonicnessOutput.sampleRate = (m_stepSize == 0) ? m_inputSampleRate/2048 : m_inputSampleRate/m_stepSize;
mail@116 203 list.push_back(monophonicnessOutput);
matthiasm@105 204 m_outputMonophonicness = index++;
matthiasm@105 205
matthiasm@0 206 return list;
matthiasm@0 207 }
matthiasm@0 208
matthiasm@0 209
matthiasm@0 210 bool
matthiasm@0 211 NNLSChroma::initialise(size_t channels, size_t stepSize, size_t blockSize)
matthiasm@0 212 {
Chris@23 213 if (debug_on) {
Chris@23 214 cerr << "--> initialise";
Chris@23 215 }
matthiasm@1 216
Chris@35 217 if (!NNLSBase::initialise(channels, stepSize, blockSize)) {
Chris@35 218 return false;
Chris@35 219 }
matthiasm@1 220
matthiasm@0 221 return true;
matthiasm@0 222 }
matthiasm@0 223
matthiasm@0 224 void
matthiasm@0 225 NNLSChroma::reset()
matthiasm@0 226 {
Chris@23 227 if (debug_on) cerr << "--> reset";
Chris@35 228 NNLSBase::reset();
matthiasm@0 229 }
matthiasm@0 230
matthiasm@0 231 NNLSChroma::FeatureSet
matthiasm@0 232 NNLSChroma::process(const float *const *inputBuffers, Vamp::RealTime timestamp)
matthiasm@0 233 {
Chris@23 234 if (debug_on) cerr << "--> process" << endl;
Chris@35 235
Chris@35 236 NNLSBase::baseProcess(inputBuffers, timestamp);
matthiasm@0 237
Chris@23 238 FeatureSet fs;
mail@117 239 fs[m_outputLogfreqspec].push_back(m_logSpectrum[m_logSpectrum.size()-1]);
Chris@23 240 return fs;
matthiasm@0 241 }
matthiasm@0 242
matthiasm@0 243 NNLSChroma::FeatureSet
matthiasm@0 244 NNLSChroma::getRemainingFeatures()
matthiasm@0 245 {
mail@100 246 static const int nConsonance = 24;
mail@100 247 float consonancepattern[nConsonance] = {0,-1,-1,1,1,1,-1,1,1,1,-1,-1,1,-1,-1,1,1,1,-1,1,1,1,-1,-1};
mail@100 248 float consonancemean = 0;
mail@100 249 for (int i = 0; i< nConsonance; ++i) {
mail@100 250 consonancemean += consonancepattern[i]/nConsonance;
mail@100 251 }
mail@84 252
mail@100 253 for (int i = 0; i< nConsonance; ++i) {
mail@100 254 consonancepattern[i] -= consonancemean;
mail@100 255 }
mail@119 256
mail@119 257 if (debug_on) cerr << "--> getRemainingFeatures" << endl;
Chris@23 258 FeatureSet fsOut;
Chris@35 259 if (m_logSpectrum.size() == 0) return fsOut;
mail@119 260
Chris@23 261 /** Calculate Tuning
Chris@23 262 calculate tuning from (using the angle of the complex number defined by the
Chris@23 263 cumulative mean real and imag values)
Chris@23 264 **/
mail@80 265 float meanTuningImag = 0;
mail@80 266 float meanTuningReal = 0;
mail@80 267 for (int iBPS = 0; iBPS < nBPS; ++iBPS) {
mail@80 268 meanTuningReal += m_meanTunings[iBPS] * cosvalues[iBPS];
mail@80 269 meanTuningImag += m_meanTunings[iBPS] * sinvalues[iBPS];
mail@80 270 }
Chris@23 271 float cumulativetuning = 440 * pow(2,atan2(meanTuningImag, meanTuningReal)/(24*M_PI));
Chris@23 272 float normalisedtuning = atan2(meanTuningImag, meanTuningReal)/(2*M_PI);
Chris@23 273 int intShift = floor(normalisedtuning * 3);
mail@80 274 float floatShift = normalisedtuning * 3 - intShift; // floatShift is a really bad name for this
matthiasm@1 275
Chris@23 276 char buffer0 [50];
matthiasm@1 277
Chris@23 278 sprintf(buffer0, "estimated tuning: %0.1f Hz", cumulativetuning);
mail@119 279
Chris@23 280 /** Tune Log-Frequency Spectrogram
Chris@23 281 calculate a tuned log-frequency spectrogram (f2): use the tuning estimated above (kinda f0) to
Chris@23 282 perform linear interpolation on the existing log-frequency spectrogram (kinda f1).
Chris@23 283 **/
Chris@23 284 cerr << endl << "[NNLS Chroma Plugin] Tuning Log-Frequency Spectrogram ... ";
matthiasm@13 285
Chris@23 286 float tempValue = 0;
Chris@23 287 float dbThreshold = 0; // relative to the background spectrum
Chris@23 288 float thresh = pow(10,dbThreshold/20);
Chris@23 289 int count = 0;
mail@77 290
matthiasm@1 291
Chris@35 292 for (FeatureList::iterator i = m_logSpectrum.begin(); i != m_logSpectrum.end(); ++i) {
Chris@23 293 Feature f1 = *i;
Chris@23 294 Feature f2; // tuned log-frequency spectrum
Chris@23 295 f2.hasTimestamp = true;
Chris@23 296 f2.timestamp = f1.timestamp;
Chris@23 297 f2.values.push_back(0.0); f2.values.push_back(0.0); // set lower edge to zero
matthiasm@1 298
matthiasm@85 299
Chris@23 300 if (m_tuneLocal) {
Chris@23 301 intShift = floor(m_localTuning[count] * 3);
mail@80 302 floatShift = m_localTuning[count] * 3 - intShift; // floatShift is a really bad name for this
Chris@23 303 }
matthiasm@1 304
mail@80 305 // cerr << intShift << " " << floatShift << endl;
matthiasm@1 306
Chris@23 307 for (unsigned k = 2; k < f1.values.size() - 3; ++k) { // interpolate all inner bins
mail@80 308 tempValue = f1.values[k + intShift] * (1-floatShift) + f1.values[k+intShift+1] * floatShift;
Chris@23 309 f2.values.push_back(tempValue);
Chris@23 310 }
matthiasm@1 311
Chris@23 312 f2.values.push_back(0.0); f2.values.push_back(0.0); f2.values.push_back(0.0); // upper edge
mail@77 313
Chris@23 314 vector<float> runningmean = SpecialConvolution(f2.values,hw);
Chris@23 315 vector<float> runningstd;
mail@77 316 for (int i = 0; i < nNote; i++) { // first step: squared values into vector (variance)
Chris@23 317 runningstd.push_back((f2.values[i] - runningmean[i]) * (f2.values[i] - runningmean[i]));
Chris@23 318 }
Chris@23 319 runningstd = SpecialConvolution(runningstd,hw); // second step convolve
mail@77 320 for (int i = 0; i < nNote; i++) {
Chris@23 321 runningstd[i] = sqrt(runningstd[i]); // square root to finally have running std
Chris@23 322 if (runningstd[i] > 0) {
Chris@23 323 // f2.values[i] = (f2.values[i] / runningmean[i]) > thresh ?
mail@41 324 // (f2.values[i] - runningmean[i]) / pow(runningstd[i],m_whitening) : 0;
Chris@23 325 f2.values[i] = (f2.values[i] - runningmean[i]) > 0 ?
mail@41 326 (f2.values[i] - runningmean[i]) / pow(runningstd[i],m_whitening) : 0;
Chris@23 327 }
Chris@23 328 if (f2.values[i] < 0) {
Chris@23 329 cerr << "ERROR: negative value in logfreq spectrum" << endl;
Chris@23 330 }
Chris@23 331 }
mail@117 332 fsOut[m_outputTunedlogfreqspec].push_back(f2);
Chris@23 333 count++;
Chris@23 334 }
Chris@23 335 cerr << "done." << endl;
matthiasm@1 336
Chris@23 337 /** Semitone spectrum and chromagrams
Chris@23 338 Semitone-spaced log-frequency spectrum derived from the tuned log-freq spectrum above. the spectrum
Chris@23 339 is inferred using a non-negative least squares algorithm.
Chris@23 340 Three different kinds of chromagram are calculated, "treble", "bass", and "both" (which means
Chris@23 341 bass and treble stacked onto each other).
Chris@23 342 **/
matthiasm@42 343 if (m_useNNLS == 0) {
Chris@23 344 cerr << "[NNLS Chroma Plugin] Mapping to semitone spectrum and chroma ... ";
Chris@23 345 } else {
Chris@23 346 cerr << "[NNLS Chroma Plugin] Performing NNLS and mapping to chroma ... ";
Chris@23 347 }
matthiasm@13 348
matthiasm@1 349
Chris@23 350 vector<float> oldchroma = vector<float>(12,0);
Chris@23 351 vector<float> oldbasschroma = vector<float>(12,0);
Chris@23 352 count = 0;
matthiasm@9 353
mail@117 354 for (FeatureList::iterator it = fsOut[m_outputTunedlogfreqspec].begin(); it != fsOut[m_outputTunedlogfreqspec].end(); ++it) {
Chris@23 355 Feature f2 = *it; // logfreq spectrum
Chris@23 356 Feature f3; // semitone spectrum
Chris@23 357 Feature f4; // treble chromagram
Chris@23 358 Feature f5; // bass chromagram
Chris@23 359 Feature f6; // treble and bass chromagram
matthiasm@85 360 Feature consonance;
matthiasm@105 361 Feature monophonicness;
matthiasm@85 362
Chris@23 363 f3.hasTimestamp = true;
Chris@23 364 f3.timestamp = f2.timestamp;
matthiasm@1 365
Chris@23 366 f4.hasTimestamp = true;
Chris@23 367 f4.timestamp = f2.timestamp;
matthiasm@1 368
Chris@23 369 f5.hasTimestamp = true;
Chris@23 370 f5.timestamp = f2.timestamp;
matthiasm@1 371
Chris@23 372 f6.hasTimestamp = true;
Chris@23 373 f6.timestamp = f2.timestamp;
matthiasm@1 374
matthiasm@85 375 consonance.hasTimestamp = true;
matthiasm@85 376 consonance.timestamp = f2.timestamp;
matthiasm@105 377
matthiasm@105 378 monophonicness.hasTimestamp = true;
matthiasm@105 379 monophonicness.timestamp = f2.timestamp;
matthiasm@85 380
mail@77 381 float b[nNote];
matthiasm@1 382
Chris@23 383 bool some_b_greater_zero = false;
Chris@23 384 float sumb = 0;
mail@77 385 for (int i = 0; i < nNote; i++) {
mail@77 386 // b[i] = m_dict[(nNote * count + i) % (nNote * 84)];
Chris@23 387 b[i] = f2.values[i];
Chris@23 388 sumb += b[i];
Chris@23 389 if (b[i] > 0) {
Chris@23 390 some_b_greater_zero = true;
Chris@23 391 }
Chris@23 392 }
matthiasm@1 393
Chris@23 394 // here's where the non-negative least squares algorithm calculates the note activation x
matthiasm@1 395
Chris@23 396 vector<float> chroma = vector<float>(12, 0);
Chris@23 397 vector<float> basschroma = vector<float>(12, 0);
Chris@23 398 float currval;
Chris@23 399 unsigned iSemitone = 0;
matthiasm@1 400
Chris@23 401 if (some_b_greater_zero) {
matthiasm@42 402 if (m_useNNLS == 0) {
mail@80 403 for (unsigned iNote = nBPS/2 + 2; iNote < nNote - nBPS/2; iNote += nBPS) {
Chris@23 404 currval = 0;
mail@80 405 for (int iBPS = -nBPS/2; iBPS < nBPS/2+1; ++iBPS) {
mail@80 406 currval += b[iNote + iBPS] * (1-abs(iBPS*1.0/(nBPS/2+1)));
mail@80 407 }
Chris@23 408 f3.values.push_back(currval);
Chris@23 409 chroma[iSemitone % 12] += currval * treblewindow[iSemitone];
Chris@23 410 basschroma[iSemitone % 12] += currval * basswindow[iSemitone];
Chris@23 411 iSemitone++;
Chris@23 412 }
matthiasm@1 413
Chris@23 414 } else {
Chris@35 415 float x[84+1000];
Chris@23 416 for (int i = 1; i < 1084; ++i) x[i] = 1.0;
Chris@23 417 vector<int> signifIndex;
Chris@23 418 int index=0;
Chris@23 419 sumb /= 84.0;
mail@80 420 for (unsigned iNote = nBPS/2 + 2; iNote < nNote - nBPS/2; iNote += nBPS) {
Chris@23 421 float currval = 0;
mail@80 422 for (int iBPS = -nBPS/2; iBPS < nBPS/2+1; ++iBPS) {
mail@80 423 currval += b[iNote + iBPS];
mail@80 424 }
Chris@23 425 if (currval > 0) signifIndex.push_back(index);
Chris@23 426 f3.values.push_back(0); // fill the values, change later
Chris@23 427 index++;
Chris@23 428 }
Chris@35 429 float rnorm;
Chris@35 430 float w[84+1000];
Chris@35 431 float zz[84+1000];
Chris@23 432 int indx[84+1000];
Chris@23 433 int mode;
mail@77 434 int dictsize = nNote*signifIndex.size();
Chris@23 435 // cerr << "dictsize is " << dictsize << "and values size" << f3.values.size()<< endl;
Chris@35 436 float *curr_dict = new float[dictsize];
Chris@91 437 for (int iNote = 0; iNote < (int)signifIndex.size(); ++iNote) {
Chris@91 438 for (int iBin = 0; iBin < nNote; iBin++) {
mail@77 439 curr_dict[iNote * nNote + iBin] = 1.0 * m_dict[signifIndex[iNote] * nNote + iBin];
Chris@23 440 }
Chris@23 441 }
Chris@35 442 nnls(curr_dict, nNote, nNote, signifIndex.size(), b, x, &rnorm, w, zz, indx, &mode);
Chris@23 443 delete [] curr_dict;
Chris@91 444 for (int iNote = 0; iNote < (int)signifIndex.size(); ++iNote) {
Chris@23 445 f3.values[signifIndex[iNote]] = x[iNote];
Chris@23 446 // cerr << mode << endl;
Chris@23 447 chroma[signifIndex[iNote] % 12] += x[iNote] * treblewindow[signifIndex[iNote]];
Chris@23 448 basschroma[signifIndex[iNote] % 12] += x[iNote] * basswindow[signifIndex[iNote]];
Chris@23 449 }
Chris@23 450 }
matthiasm@79 451 } else {
matthiasm@79 452 for (int i = 0; i < 84; ++i) f3.values.push_back(0);
Chris@23 453 }
matthiasm@85 454
matthiasm@85 455 float notesum = 0;
matthiasm@85 456
matthiasm@85 457 consonance.values.push_back(0);
matthiasm@104 458
matthiasm@105 459 float note_max = 0;
matthiasm@105 460 float note_runnerup = 0;
matthiasm@105 461 // float note_sum = 0;
matthiasm@105 462 for (int iSemitone = 0; iSemitone < 84; iSemitone++) {
matthiasm@105 463 float currvalue = f3.values[iSemitone] * treblewindow[iSemitone];
matthiasm@105 464 if (currvalue > note_max) {
matthiasm@105 465 note_runnerup = note_max;
matthiasm@105 466 note_max = currvalue;
matthiasm@105 467 } else if (currvalue > note_runnerup) {
matthiasm@105 468 note_runnerup = currvalue;
matthiasm@105 469 }
matthiasm@105 470 // note_sum += note[iPitchClass];
matthiasm@105 471 }
matthiasm@105 472 // float note_monophonicness = 12*note_max/(12*note_max+note_sum);
mail@111 473 // cerr << note_max << endl;
mail@111 474 // cerr << note_runnerup << endl << endl;
matthiasm@105 475 float note_monophonicness = 0.5;
matthiasm@105 476 if (note_max > 0) {
matthiasm@105 477 note_monophonicness = (note_max / (note_max+note_runnerup) - 0.5) * 2;
matthiasm@105 478 }
matthiasm@105 479 monophonicness.values.push_back(note_monophonicness);
matthiasm@105 480
matthiasm@104 481 for (int iSemitone = 0; iSemitone < 84; ++iSemitone) {
matthiasm@104 482 float tempconsonance = 0;
matthiasm@104 483 int sumlength = 1;
matthiasm@85 484 for (int jSemitone = 1; jSemitone < 24; ++jSemitone) {
matthiasm@104 485 if (iSemitone+jSemitone > 84-1) break;
matthiasm@104 486 sumlength++;
mail@100 487 tempconsonance += f3.values[iSemitone+jSemitone] * (consonancepattern[jSemitone]) * treblewindow[iSemitone+jSemitone];
matthiasm@85 488 }
matthiasm@104 489 notesum += f3.values[iSemitone] * f3.values[iSemitone] * treblewindow[iSemitone] * treblewindow[iSemitone] * sumlength;
matthiasm@104 490 consonance.values[0] += (f3.values[iSemitone] * tempconsonance * treblewindow[iSemitone]) * sumlength;
matthiasm@85 491 }
matthiasm@104 492 // cerr << consonance.values[0] << " " << f3.timestamp << " "<< notesum << endl;
matthiasm@86 493 if (notesum > 0) consonance.values[0] /= notesum;
matthiasm@104 494
matthiasm@85 495
Chris@23 496 f4.values = chroma;
Chris@23 497 f5.values = basschroma;
Chris@23 498 chroma.insert(chroma.begin(), basschroma.begin(), basschroma.end()); // just stack the both chromas
Chris@23 499 f6.values = chroma;
matthiasm@1 500
Chris@23 501 if (m_doNormalizeChroma > 0) {
Chris@23 502 vector<float> chromanorm = vector<float>(3,0);
Chris@23 503 switch (int(m_doNormalizeChroma)) {
Chris@23 504 case 0: // should never end up here
Chris@23 505 break;
Chris@23 506 case 1:
Chris@23 507 chromanorm[0] = *max_element(f4.values.begin(), f4.values.end());
Chris@23 508 chromanorm[1] = *max_element(f5.values.begin(), f5.values.end());
Chris@23 509 chromanorm[2] = max(chromanorm[0], chromanorm[1]);
Chris@23 510 break;
Chris@23 511 case 2:
Chris@23 512 for (vector<float>::iterator it = f4.values.begin(); it != f4.values.end(); ++it) {
Chris@23 513 chromanorm[0] += *it;
Chris@23 514 }
Chris@23 515 for (vector<float>::iterator it = f5.values.begin(); it != f5.values.end(); ++it) {
Chris@23 516 chromanorm[1] += *it;
Chris@23 517 }
Chris@23 518 for (vector<float>::iterator it = f6.values.begin(); it != f6.values.end(); ++it) {
Chris@23 519 chromanorm[2] += *it;
Chris@23 520 }
Chris@23 521 break;
Chris@23 522 case 3:
Chris@23 523 for (vector<float>::iterator it = f4.values.begin(); it != f4.values.end(); ++it) {
Chris@23 524 chromanorm[0] += pow(*it,2);
Chris@23 525 }
Chris@23 526 chromanorm[0] = sqrt(chromanorm[0]);
Chris@23 527 for (vector<float>::iterator it = f5.values.begin(); it != f5.values.end(); ++it) {
Chris@23 528 chromanorm[1] += pow(*it,2);
Chris@23 529 }
Chris@23 530 chromanorm[1] = sqrt(chromanorm[1]);
Chris@23 531 for (vector<float>::iterator it = f6.values.begin(); it != f6.values.end(); ++it) {
Chris@23 532 chromanorm[2] += pow(*it,2);
Chris@23 533 }
Chris@23 534 chromanorm[2] = sqrt(chromanorm[2]);
Chris@23 535 break;
Chris@23 536 }
Chris@23 537 if (chromanorm[0] > 0) {
Chris@91 538 for (size_t i = 0; i < f4.values.size(); i++) {
Chris@23 539 f4.values[i] /= chromanorm[0];
Chris@23 540 }
Chris@23 541 }
Chris@23 542 if (chromanorm[1] > 0) {
Chris@91 543 for (size_t i = 0; i < f5.values.size(); i++) {
Chris@23 544 f5.values[i] /= chromanorm[1];
Chris@23 545 }
Chris@23 546 }
Chris@23 547 if (chromanorm[2] > 0) {
Chris@91 548 for (size_t i = 0; i < f6.values.size(); i++) {
Chris@23 549 f6.values[i] /= chromanorm[2];
Chris@23 550 }
Chris@23 551 }
Chris@23 552 }
matthiasm@13 553
mail@117 554 fsOut[m_outputSemitonespectrum].push_back(f3);
Chris@35 555 fsOut[m_outputChroma].push_back(f4);
mail@117 556 fsOut[m_outputBasschroma].push_back(f5);
mail@117 557 fsOut[m_outputBothchroma].push_back(f6);
matthiasm@85 558 fsOut[m_outputConsonance].push_back(consonance);
matthiasm@105 559 fsOut[m_outputMonophonicness].push_back(monophonicness);
Chris@23 560 count++;
Chris@23 561 }
Chris@23 562 cerr << "done." << endl;
matthiasm@10 563
Chris@23 564 return fsOut;
matthiasm@0 565
matthiasm@0 566 }
matthiasm@0 567