qm-dsp: dsp/onsets/DetectionFunction.cpp annotate

annotate dsp/onsets/DetectionFunction.cpp @ 289:befe5aa6b450

* Refactor FFT a little bit so as to separate construction and processing rather than have a single static method -- will make it easier to use a different implementation * pull in KissFFT implementation (not hooked up yet)

author	Chris Cannam <c.cannam@qmul.ac.uk>
date	Wed, 13 May 2009 09:19:12 +0000
parents	9c403afdd9e9
children	e5907ae6de17

rev	line source
c@225	1 /* -- c-basic-offset: 4 indent-tabs-mode: nil -- vi:set ts=8 sts=4 sw=4: */
c@225	2
c@225	3 /*
c@225	4 QM DSP Library
c@225	5
c@225	6 Centre for Digital Music, Queen Mary, University of London.
c@225	7 This file copyright 2005-2006 Christian Landone.
c@225	8 All rights reserved.
c@225	9 */
c@225	10
c@225	11 #include "DetectionFunction.h"
c@272	12 #include <cstring>
c@225	13
c@225	14 //////////////////////////////////////////////////////////////////////
c@225	15 // Construction/Destruction
c@225	16 //////////////////////////////////////////////////////////////////////
c@225	17
c@225	18 DetectionFunction::DetectionFunction( DFConfig Config ) :
c@225	19 m_window(0)
c@225	20 {
c@227	21 m_magHistory = NULL;
c@227	22 m_phaseHistory = NULL;
c@227	23 m_phaseHistoryOld = NULL;
c@239	24 m_magPeaks = NULL;
c@225	25
c@225	26 initialise( Config );
c@225	27 }
c@225	28
c@225	29 DetectionFunction::~DetectionFunction()
c@225	30 {
c@225	31 deInitialise();
c@225	32 }
c@225	33
c@225	34
c@225	35 void DetectionFunction::initialise( DFConfig Config )
c@225	36 {
c@225	37 m_dataLength = Config.frameLength;
c@225	38 m_halfLength = m_dataLength/2;
c@239	39
c@225	40 m_DFType = Config.DFType;
c@238	41 m_stepSize = Config.stepSize;
c@225	42
c@239	43 m_whiten = Config.adaptiveWhitening;
c@239	44 m_whitenRelaxCoeff = Config.whiteningRelaxCoeff;
c@239	45 m_whitenFloor = Config.whiteningFloor;
c@239	46 if (m_whitenRelaxCoeff < 0) m_whitenRelaxCoeff = 0.9997;
c@239	47 if (m_whitenFloor < 0) m_whitenFloor = 0.01;
c@239	48
c@227	49 m_magHistory = new double[ m_halfLength ];
c@227	50 memset(m_magHistory,0, m_halfLength*sizeof(double));
c@225	51
c@227	52 m_phaseHistory = new double[ m_halfLength ];
c@227	53 memset(m_phaseHistory,0, m_halfLength*sizeof(double));
c@225	54
c@227	55 m_phaseHistoryOld = new double[ m_halfLength ];
c@227	56 memset(m_phaseHistoryOld,0, m_halfLength*sizeof(double));
c@225	57
c@239	58 m_magPeaks = new double[ m_halfLength ];
c@239	59 memset(m_magPeaks,0, m_halfLength*sizeof(double));
c@239	60
c@289	61 // See note in process(const double *) below
c@289	62 int actualLength = MathUtilities::previousPowerOfTwo(m_dataLength);
c@289	63 m_phaseVoc = new PhaseVocoder(actualLength);
c@225	64
c@225	65 m_DFWindowedFrame = new double[ m_dataLength ];
c@225	66 m_magnitude = new double[ m_halfLength ];
c@225	67 m_thetaAngle = new double[ m_halfLength ];
c@225	68
c@225	69 m_window = new Window<double>(HanningWindow, m_dataLength);
c@225	70 }
c@225	71
c@225	72 void DetectionFunction::deInitialise()
c@225	73 {
c@227	74 delete [] m_magHistory ;
c@227	75 delete [] m_phaseHistory ;
c@227	76 delete [] m_phaseHistoryOld ;
c@239	77 delete [] m_magPeaks ;
c@225	78
c@225	79 delete m_phaseVoc;
c@225	80
c@225	81 delete [] m_DFWindowedFrame;
c@225	82 delete [] m_magnitude;
c@225	83 delete [] m_thetaAngle;
c@225	84
c@225	85 delete m_window;
c@225	86 }
c@225	87
c@280	88 double DetectionFunction::process( const double *TDomain )
c@225	89 {
c@225	90 m_window->cut( TDomain, m_DFWindowedFrame );
c@280	91
c@280	92 // Our own FFT implementation supports power-of-two sizes only.
c@280	93 // If we have to use this implementation (as opposed to the
c@280	94 // version of process() below that operates on frequency domain
c@280	95 // data directly), we will have to use the next smallest power of
c@280	96 // two from the block size. Results may vary accordingly!
c@280	97
c@280	98 int actualLength = MathUtilities::previousPowerOfTwo(m_dataLength);
c@280	99
c@280	100 if (actualLength != m_dataLength) {
c@280	101 // Pre-fill mag and phase vectors with zero, as the FFT output
c@280	102 // will not fill the arrays
c@280	103 for (int i = actualLength/2; i < m_dataLength/2; ++i) {
c@280	104 m_magnitude[i] = 0;
c@280	105 m_thetaAngle[0] = 0;
c@280	106 }
c@280	107 }
c@280	108
c@289	109 m_phaseVoc->process(m_DFWindowedFrame, m_magnitude, m_thetaAngle);
c@225	110
c@239	111 if (m_whiten) whiten();
c@239	112
c@227	113 return runDF();
c@227	114 }
c@227	115
c@280	116 double DetectionFunction::process( const double magnitudes, const double phases )
c@227	117 {
c@227	118 for (size_t i = 0; i < m_halfLength; ++i) {
c@227	119 m_magnitude[i] = magnitudes[i];
c@227	120 m_thetaAngle[i] = phases[i];
c@227	121 }
c@227	122
c@239	123 if (m_whiten) whiten();
c@239	124
c@227	125 return runDF();
c@227	126 }
c@227	127
c@239	128 void DetectionFunction::whiten()
c@239	129 {
c@239	130 for (unsigned int i = 0; i < m_halfLength; ++i) {
c@239	131 double m = m_magnitude[i];
c@239	132 if (m < m_magPeaks[i]) {
c@239	133 m = m + (m_magPeaks[i] - m) * m_whitenRelaxCoeff;
c@239	134 }
c@239	135 if (m < m_whitenFloor) m = m_whitenFloor;
c@239	136 m_magPeaks[i] = m;
c@239	137 m_magnitude[i] /= m;
c@239	138 }
c@239	139 }
c@239	140
c@227	141 double DetectionFunction::runDF()
c@227	142 {
c@227	143 double retVal = 0;
c@227	144
c@225	145 switch( m_DFType )
c@225	146 {
c@225	147 case DF_HFC:
c@225	148 retVal = HFC( m_halfLength, m_magnitude);
c@225	149 break;
c@225	150
c@238	151 case DF_SPECDIFF:
c@225	152 retVal = specDiff( m_halfLength, m_magnitude);
c@225	153 break;
c@225	154
c@225	155 case DF_PHASEDEV:
c@239	156 retVal = phaseDev( m_halfLength, m_thetaAngle);
c@225	157 break;
c@225	158
c@225	159 case DF_COMPLEXSD:
c@225	160 retVal = complexSD( m_halfLength, m_magnitude, m_thetaAngle);
c@225	161 break;
c@237	162
c@237	163 case DF_BROADBAND:
c@239	164 retVal = broadband( m_halfLength, m_magnitude);
c@239	165 break;
c@225	166 }
c@225	167
c@225	168 return retVal;
c@225	169 }
c@225	170
c@225	171 double DetectionFunction::HFC(unsigned int length, double *src)
c@225	172 {
c@225	173 unsigned int i;
c@225	174 double val = 0;
c@225	175
c@225	176 for( i = 0; i < length; i++)
c@225	177 {
c@225	178 val += src[ i ] * ( i + 1);
c@225	179 }
c@225	180 return val;
c@225	181 }
c@225	182
c@225	183 double DetectionFunction::specDiff(unsigned int length, double *src)
c@225	184 {
c@225	185 unsigned int i;
c@225	186 double val = 0.0;
c@225	187 double temp = 0.0;
c@225	188 double diff = 0.0;
c@225	189
c@225	190 for( i = 0; i < length; i++)
c@225	191 {
c@227	192 temp = fabs( (src[ i ] * src[ i ]) - (m_magHistory[ i ] * m_magHistory[ i ]) );
c@225	193
c@225	194 diff= sqrt(temp);
c@225	195
c@238	196 // (See note in phaseDev below.)
c@238	197
c@238	198 val += diff;
c@225	199
c@227	200 m_magHistory[ i ] = src[ i ];
c@225	201 }
c@225	202
c@225	203 return val;
c@225	204 }
c@225	205
c@225	206
c@239	207 double DetectionFunction::phaseDev(unsigned int length, double *srcPhase)
c@225	208 {
c@225	209 unsigned int i;
c@225	210 double tmpPhase = 0;
c@225	211 double tmpVal = 0;
c@225	212 double val = 0;
c@225	213
c@225	214 double dev = 0;
c@225	215
c@225	216 for( i = 0; i < length; i++)
c@225	217 {
c@227	218 tmpPhase = (srcPhase[ i ]- 2*m_phaseHistory[ i ]+m_phaseHistoryOld[ i ]);
c@225	219 dev = MathUtilities::princarg( tmpPhase );
c@238	220
c@238	221 // A previous version of this code only counted the value here
c@238	222 // if the magnitude exceeded 0.1. My impression is that
c@238	223 // doesn't greatly improve the results for "loud" music (so
c@238	224 // long as the peak picker is reasonably sophisticated), but
c@238	225 // does significantly damage its ability to work with quieter
c@238	226 // music, so I'm removing it and counting the result always.
c@238	227 // Same goes for the spectral difference measure above.
c@225	228
c@238	229 tmpVal = fabs(dev);
c@238	230 val += tmpVal ;
c@225	231
c@227	232 m_phaseHistoryOld[ i ] = m_phaseHistory[ i ] ;
c@227	233 m_phaseHistory[ i ] = srcPhase[ i ];
c@225	234 }
c@225	235
c@225	236
c@225	237 return val;
c@225	238 }
c@225	239
c@225	240
c@225	241 double DetectionFunction::complexSD(unsigned int length, double srcMagnitude, double srcPhase)
c@225	242 {
c@225	243 unsigned int i;
c@225	244 double val = 0;
c@225	245 double tmpPhase = 0;
c@225	246 double tmpReal = 0;
c@225	247 double tmpImag = 0;
c@225	248
c@225	249 double dev = 0;
c@225	250 ComplexData meas = ComplexData( 0, 0 );
c@227	251 ComplexData j = ComplexData( 0, 1 );
c@225	252
c@225	253 for( i = 0; i < length; i++)
c@225	254 {
c@227	255 tmpPhase = (srcPhase[ i ]- 2*m_phaseHistory[ i ]+m_phaseHistoryOld[ i ]);
c@225	256 dev= MathUtilities::princarg( tmpPhase );
c@225	257
c@227	258 meas = m_magHistory[i] - ( srcMagnitude[ i ] * exp( j * dev) );
c@225	259
c@225	260 tmpReal = real( meas );
c@225	261 tmpImag = imag( meas );
c@225	262
c@225	263 val += sqrt( (tmpReal * tmpReal) + (tmpImag * tmpImag) );
c@225	264
c@227	265 m_phaseHistoryOld[ i ] = m_phaseHistory[ i ] ;
c@227	266 m_phaseHistory[ i ] = srcPhase[ i ];
c@227	267 m_magHistory[ i ] = srcMagnitude[ i ];
c@225	268 }
c@225	269
c@225	270 return val;
c@225	271 }
c@225	272
c@239	273 double DetectionFunction::broadband(unsigned int length, double *src)
c@237	274 {
c@237	275 double val = 0;
c@237	276 for (unsigned int i = 0; i < length; ++i) {
c@239	277 double sqrmag = src[i] * src[i];
c@237	278 if (m_magHistory[i] > 0.0) {
c@237	279 double diff = 10.0 * log10(sqrmag / m_magHistory[i]);
c@237	280 if (diff > m_dbRise) val = val + 1;
c@237	281 }
c@237	282 m_magHistory[i] = sqrmag;
c@237	283 }
c@237	284 return val;
c@237	285 }
c@237	286
c@225	287 double* DetectionFunction::getSpectrumMagnitude()
c@225	288 {
c@225	289 return m_magnitude;
c@225	290 }
c@225	291

Mercurial > hg > qm-dsp

annotate dsp/onsets/DetectionFunction.cpp @ 289:befe5aa6b450