annotate dsp/keydetection/GetKeyMode.cpp @ 43:b4921bfd2aea

* remove exceptions from Polyfit, return bool instead of int from isModeMinor
author cannam
date Thu, 07 Feb 2008 10:01:38 +0000
parents 163f6e03e9e7
children 38bf09927942
rev   line source
cannam@34 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
cannam@34 2
cannam@7 3 // GetKeyMode.cpp: implementation of the CGetKeyMode class.
cannam@7 4 //
cannam@7 5 //////////////////////////////////////////////////////////////////////
cannam@7 6
#include "GetKeyMode.h"
#include "maths/MathUtilities.h"
#include "base/Pitch.h"

#include <cmath>
#include <cstdlib>
#include <cstring>
#include <iostream>
cannam@7 12
// Chords profile
//
// Reference profiles that process() correlates the averaged chroma against.
// Each table holds 36 values, matching the 36 bins per octave configured in
// the constructor; they are laid out here three bins per row (36 / 12).
static double MajProfile[36] = {
    0.0384, 0.0629, 0.0258,
    0.0121, 0.0146, 0.0106,
    0.0364, 0.0610, 0.0267,
    0.0126, 0.0121, 0.0086,
    0.0364, 0.0623, 0.0279,
    0.0275, 0.0414, 0.0186,
    0.0173, 0.0248, 0.0145,
    0.0364, 0.0631, 0.0262,
    0.0129, 0.0150, 0.0098,
    0.0312, 0.0521, 0.0235,
    0.0129, 0.0142, 0.0095,
    0.0289, 0.0478, 0.0239
};

static double MinProfile[36] = {
    0.0375, 0.0682, 0.0299,
    0.0119, 0.0138, 0.0093,
    0.0296, 0.0543, 0.0257,
    0.0292, 0.0519, 0.0246,
    0.0159, 0.0234, 0.0135,
    0.0291, 0.0544, 0.0248,
    0.0137, 0.0176, 0.0104,
    0.0352, 0.0670, 0.0302,
    0.0222, 0.0349, 0.0164,
    0.0174, 0.0297, 0.0166,
    0.0222, 0.0401, 0.0202,
    0.0175, 0.0270, 0.0146
};
cannam@7 25 //
cannam@40 26
cannam@7 27
cannam@7 28 //////////////////////////////////////////////////////////////////////
cannam@7 29 // Construction/Destruction
cannam@7 30 //////////////////////////////////////////////////////////////////////
cannam@7 31
cannam@9 32 GetKeyMode::GetKeyMode( int sampleRate, float tuningFrequency,
cannam@34 33 double hpcpAverage, double medianAverage ) :
cannam@34 34 m_hpcpAverage( hpcpAverage ),
cannam@34 35 m_medianAverage( medianAverage ),
cannam@34 36 m_ChrPointer(0),
cannam@34 37 m_DecimatedBuffer(0),
cannam@34 38 m_ChromaBuffer(0),
cannam@34 39 m_MeanHPCP(0),
cannam@34 40 m_MajCorr(0),
cannam@34 41 m_MinCorr(0),
cannam@34 42 m_Keys(0),
cannam@34 43 m_MedianFilterBuffer(0),
cannam@40 44 m_SortedBuffer(0),
cannam@40 45 m_keyStrengths(0)
cannam@7 46 {
cannam@34 47 m_DecimationFactor = 8;
cannam@34 48
cannam@34 49 // Chromagram configuration parameters
cannam@34 50 m_ChromaConfig.normalise = MathUtilities::NormaliseUnitMax;
cannam@34 51 m_ChromaConfig.FS = lrint(sampleRate/(double)m_DecimationFactor);
cannam@7 52
cannam@34 53 // Set C (= MIDI #12) as our base :
cannam@34 54 // This implies that key = 1 => Cmaj, key = 12 => Bmaj, key = 13 => Cmin, etc.
cannam@34 55 m_ChromaConfig.min = Pitch::getFrequencyForPitch
cannam@40 56 (48, 0, tuningFrequency);
cannam@34 57 m_ChromaConfig.max = Pitch::getFrequencyForPitch
cannam@34 58 (96, 0, tuningFrequency);
cannam@9 59
cannam@34 60 m_ChromaConfig.BPO = 36;
cannam@34 61 m_ChromaConfig.CQThresh = 0.0054;
cannam@9 62
cannam@34 63 // Chromagram inst.
cannam@34 64 m_Chroma = new Chromagram( m_ChromaConfig );
cannam@10 65
cannam@34 66 // Get calculated parameters from chroma object
cannam@34 67 m_ChromaFrameSize = m_Chroma->getFrameSize();
cannam@34 68 // override hopsize for this application
cannam@34 69 m_ChromaHopSize = m_ChromaFrameSize;
cannam@34 70 m_BPO = m_ChromaConfig.BPO;
cannam@10 71
cannam@40 72 // std::cerr << "chroma frame size = " << m_ChromaFrameSize << ", decimation factor = " << m_DecimationFactor << " therefore block size = " << getBlockSize() << std::endl;
cannam@40 73
cannam@34 74 // Chromagram average and estimated key median filter lengths
cannam@34 75 m_ChromaBuffersize = (int)ceil( m_hpcpAverage * m_ChromaConfig.FS/m_ChromaFrameSize );
cannam@34 76 m_MedianWinsize = (int)ceil( m_medianAverage * m_ChromaConfig.FS/m_ChromaFrameSize );
cannam@34 77
cannam@34 78 // Reset counters
cannam@34 79 m_bufferindex = 0;
cannam@34 80 m_ChromaBufferFilling = 0;
cannam@34 81 m_MedianBufferFilling = 0;
cannam@9 82
cannam@34 83 // Spawn objectc/arrays
cannam@34 84 m_DecimatedBuffer = new double[m_ChromaFrameSize];
cannam@34 85
cannam@34 86 m_ChromaBuffer = new double[m_BPO * m_ChromaBuffersize];
cannam@34 87 memset( m_ChromaBuffer, 0, sizeof(double) * m_BPO * m_ChromaBuffersize);
cannam@34 88
cannam@34 89 m_MeanHPCP = new double[m_BPO];
cannam@34 90
cannam@34 91 m_MajCorr = new double[m_BPO];
cannam@34 92 m_MinCorr = new double[m_BPO];
cannam@34 93 m_Keys = new double[2*m_BPO];
cannam@34 94
cannam@34 95 m_MedianFilterBuffer = new int[ m_MedianWinsize ];
cannam@34 96 memset( m_MedianFilterBuffer, 0, sizeof(int)*m_MedianWinsize);
cannam@34 97
cannam@34 98 m_SortedBuffer = new int[ m_MedianWinsize ];
cannam@34 99 memset( m_SortedBuffer, 0, sizeof(int)*m_MedianWinsize);
cannam@34 100
cannam@34 101 m_Decimator = new Decimator
cannam@34 102 ( m_ChromaFrameSize*m_DecimationFactor, m_DecimationFactor );
cannam@40 103
cannam@40 104 m_keyStrengths = new double[24];
cannam@7 105 }
cannam@7 106
cannam@7 107 GetKeyMode::~GetKeyMode()
cannam@7 108 {
cannam@7 109
cannam@34 110 delete m_Chroma;
cannam@34 111 delete m_Decimator;
cannam@34 112
cannam@34 113 delete [] m_DecimatedBuffer;
cannam@34 114 delete [] m_ChromaBuffer;
cannam@34 115 delete [] m_MeanHPCP;
cannam@34 116 delete [] m_MajCorr;
cannam@34 117 delete [] m_MinCorr;
cannam@34 118 delete [] m_Keys;
cannam@34 119 delete [] m_MedianFilterBuffer;
cannam@34 120 delete [] m_SortedBuffer;
cannam@40 121
cannam@40 122 delete[] m_keyStrengths;
cannam@7 123 }
cannam@7 124
cannam@7 125 double GetKeyMode::krumCorr(double *pData1, double *pData2, unsigned int length)
cannam@7 126 {
cannam@34 127 double retVal= 0.0;
cannam@34 128
cannam@34 129 double num = 0;
cannam@34 130 double den = 0;
cannam@34 131 double mX = MathUtilities::mean( pData1, length );
cannam@34 132 double mY = MathUtilities::mean( pData2, length );
cannam@34 133
cannam@34 134 double sum1 = 0;
cannam@34 135 double sum2 = 0;
cannam@34 136
cannam@34 137 for( unsigned int i = 0; i <length; i++ )
cannam@34 138 {
cannam@34 139 num += ( pData1[i] - mX ) * ( pData2[i] - mY );
cannam@7 140
cannam@34 141 sum1 += ( (pData1[i]-mX) * (pData1[i]-mX) );
cannam@34 142 sum2 += ( (pData2[i]-mY) * (pData2[i]-mY) );
cannam@34 143 }
cannam@34 144
cannam@34 145 den = sqrt(sum1 * sum2);
cannam@34 146
cannam@34 147 if( den>0 )
cannam@34 148 retVal = num/den;
cannam@34 149 else
cannam@34 150 retVal = 0;
cannam@7 151
cannam@7 152
cannam@34 153 return retVal;
cannam@7 154 }
cannam@7 155
cannam@7 156 int GetKeyMode::process(double *PCMData)
cannam@7 157 {
cannam@34 158 int key;
cannam@7 159
cannam@34 160 unsigned int j,k;
cannam@7 161
cannam@34 162 //////////////////////////////////////////////
cannam@34 163 m_Decimator->process( PCMData, m_DecimatedBuffer);
cannam@7 164
cannam@34 165 m_ChrPointer = m_Chroma->process( m_DecimatedBuffer );
cannam@7 166
chriss@15 167
cannam@34 168 // Move bins such that the centre of the base note is in the
cannam@34 169 // middle of its three bins :
cannam@34 170 // Added 21.11.07 by Chris Sutton based on debugging with Katy
cannam@34 171 // Noland + comparison with Matlab equivalent.
cannam@34 172 MathUtilities::circShift( m_ChrPointer, m_BPO, 1);
chriss@15 173
cannam@23 174 /*
cannam@34 175 std::cout << "raw chroma: ";
cannam@34 176 for (int ii = 0; ii < m_BPO; ++ii) {
cannam@34 177 std::cout << m_ChrPointer[ii] << " ";
cannam@34 178 }
cannam@34 179 std::cout << std::endl;
cannam@23 180 */
cannam@34 181 // populate hpcp values;
cannam@34 182 int cbidx;
cannam@34 183 for( j = 0; j < m_BPO; j++ )
cannam@34 184 {
cannam@34 185 cbidx = (m_bufferindex * m_BPO) + j;
cannam@34 186 m_ChromaBuffer[ cbidx ] = m_ChrPointer[j];
cannam@34 187 }
cannam@7 188
cannam@34 189 //keep track of input buffers;
cannam@34 190 if( m_bufferindex++ >= m_ChromaBuffersize - 1)
cannam@34 191 m_bufferindex = 0;
cannam@7 192
cannam@34 193 // track filling of chroma matrix
cannam@34 194 if( m_ChromaBufferFilling++ >= m_ChromaBuffersize)
cannam@34 195 m_ChromaBufferFilling = m_ChromaBuffersize;
cannam@7 196
cannam@34 197 //calculate mean
cannam@34 198 for( k = 0; k < m_BPO; k++ )
cannam@34 199 {
cannam@34 200 double mnVal = 0.0;
cannam@34 201 for( j = 0; j < m_ChromaBufferFilling; j++ )
cannam@34 202 {
cannam@34 203 mnVal += m_ChromaBuffer[ k + (j*m_BPO) ];
cannam@34 204 }
cannam@7 205
cannam@34 206 m_MeanHPCP[k] = mnVal/(double)m_ChromaBufferFilling;
cannam@34 207 }
cannam@7 208
cannam@7 209
cannam@34 210 for( k = 0; k < m_BPO; k++ )
cannam@34 211 {
cannam@34 212 m_MajCorr[k] = krumCorr( m_MeanHPCP, MajProfile, m_BPO );
cannam@34 213 m_MinCorr[k] = krumCorr( m_MeanHPCP, MinProfile, m_BPO );
cannam@7 214
cannam@34 215 MathUtilities::circShift( MajProfile, m_BPO, 1 );
cannam@34 216 MathUtilities::circShift( MinProfile, m_BPO, 1 );
cannam@34 217 }
chriss@15 218
cannam@34 219 for( k = 0; k < m_BPO; k++ )
cannam@34 220 {
cannam@34 221 m_Keys[k] = m_MajCorr[k];
cannam@34 222 m_Keys[k+m_BPO] = m_MinCorr[k];
cannam@34 223 }
chriss@15 224
cannam@40 225 for (k = 0; k < 24; ++k) {
cannam@40 226 m_keyStrengths[k] = 0;
cannam@40 227 }
cannam@40 228
cannam@40 229 for( k = 0; k < m_BPO*2; k++ )
cannam@40 230 {
cannam@40 231 m_keyStrengths[k/(m_BPO/12)] += m_Keys[k];
cannam@40 232 }
chriss@15 233
cannam@23 234 /*
cannam@34 235 std::cout << "raw keys: ";
cannam@34 236 for (int ii = 0; ii < 2*m_BPO; ++ii) {
cannam@34 237 std::cout << m_Keys[ii] << " ";
cannam@34 238 }
cannam@34 239 std::cout << std::endl;
cannam@23 240 */
cannam@34 241 double dummy;
cannam@34 242 // '1 +' because we number keys 1-24, not 0-23.
cannam@34 243 key = 1 + (int)ceil( (double)MathUtilities::getMax( m_Keys, 2* m_BPO, &dummy )/3 );
cannam@9 244
cannam@23 245 // std::cout << "key pre-sorting: " << key << std::endl;
cannam@7 246
cannam@7 247
cannam@34 248 //Median filtering
cannam@7 249
cannam@34 250 // track Median buffer initial filling
cannam@34 251 if( m_MedianBufferFilling++ >= m_MedianWinsize)
cannam@34 252 m_MedianBufferFilling = m_MedianWinsize;
cannam@7 253
cannam@34 254 //shift median buffer
cannam@34 255 for( k = 1; k < m_MedianWinsize; k++ )
cannam@34 256 {
cannam@34 257 m_MedianFilterBuffer[ k - 1 ] = m_MedianFilterBuffer[ k ];
cannam@34 258 }
cannam@7 259
cannam@34 260 //write new key value into median buffer
cannam@34 261 m_MedianFilterBuffer[ m_MedianWinsize - 1 ] = key;
cannam@7 262
cannam@7 263
cannam@34 264 //Copy median into sorting buffer, reversed
cannam@34 265 unsigned int ijx = 0;
cannam@34 266 for( k = 0; k < m_MedianWinsize; k++ )
cannam@34 267 {
cannam@34 268 m_SortedBuffer[k] = m_MedianFilterBuffer[m_MedianWinsize-1-ijx];
cannam@34 269 ijx++;
cannam@34 270 }
cannam@7 271
cannam@34 272 qsort(m_SortedBuffer, m_MedianBufferFilling, sizeof(unsigned int),
cannam@34 273 MathUtilities::compareInt);
cannam@34 274 /*
cannam@34 275 std::cout << "sorted: ";
cannam@34 276 for (int ii = 0; ii < m_MedianBufferFilling; ++ii) {
cannam@34 277 std::cout << m_SortedBuffer[ii] << " ";
cannam@34 278 }
cannam@34 279 std::cout << std::endl;
cannam@34 280 */
cannam@34 281 int sortlength = m_MedianBufferFilling;
cannam@34 282 int midpoint = (int)ceil((double)sortlength/2);
cannam@7 283
cannam@34 284 if( midpoint <= 0 )
cannam@34 285 midpoint = 1;
cannam@7 286
cannam@34 287 key = m_SortedBuffer[midpoint-1];
cannam@7 288
cannam@34 289 return key;
cannam@7 290 }
cannam@7 291
cannam@7 292
cannam@43 293 bool GetKeyMode::isModeMinor( int key )
cannam@7 294 {
cannam@34 295 return (key > 12);
cannam@7 296 }