qm-dsp: dsp/tempotracking/TempoTrackV2.cpp comparison

comparison dsp/tempotracking/TempoTrackV2.cpp @ 100:d7619173d43c mepd_new_params

Now includes latest changes from MEPD: * TempoTrackV2::calculateBeats method - exposes "alpha" and "tightness" parameters * TempoTrackV2::calculateBeatPeriod - user can specify an inputtempo (in BPM) and "constraintempo" (bool)

author	luisf <luis.figueira@eecs.qmul.ac.uk>
date	Wed, 12 Dec 2012 15:10:38 +0000
parents	e5907ae6de17
children	1e433aaa44ad

comparison

equal deleted inserted replaced

-:505ed5f42800
+:d7619173d43c
 a[1] = -0.3695;
 a[2] = 0.1958;
 b[0] = 0.2066;
 b[1] = 0.4131;
 b[2] = 0.2066;
 double inp1 = 0.;
 double inp2 = 0.;
 double out1 = 0.;
 double out2 = 0.;
 df[i] = lp_df[df.size()-i-1];
 }
 for (unsigned int i = 0;i < df.size();i++)
 {
 lp_df[i] = 0.;
 }
 inp1 = 0.; inp2 = 0.;
 out1 = 0.; out2 = 0.;
 df[i] = lp_df[df.size()-i-1];
 }
 }
+// MEPD 28/11/12
+// This function now allows for a user to specify an inputtempo (in BPM)
+// and a flag "constraintempo" which replaces the general rayleigh weighting for periodicities
+// with a gaussian which is centered around the input tempo
+// Note, if inputtempo = 120 and constraintempo = false, then functionality is
+// as it was before
 void
 TempoTrackV2::calculateBeatPeriod(const vector<double> &df,
 vector<double> &beat_period,
-vector<double> &tempi)
+vector<double> &tempi,
+double inputtempo, bool constraintempo)
 {
 // to follow matlab.. split into 512 sample frames with a 128 hop size
 // calculate the acf,
 // then the rcf.. and then stick the rcfs as columns of a matrix
 // then call viterbi decoding with weight vector and transition matrix
 // and get best path
 unsigned int wv_len = 128;
-double rayparam = 43.;
+// MEPD 28/11/12
+// the default value of inputtempo in the beat tracking plugin is 120
+// so if the user specifies a different inputtempo, the rayparam will be updated
+// accordingly.
+// note: 60*44100/512 is a magic number
+// this might (will?) break if a user specifies a different frame rate for the onset detection function
+double rayparam = (60*44100/512)/inputtempo;
+// these debug statements can be removed.
+std::cout << "inputtempo" << inputtempo << std::endl;
+std::cout << "rayparam" << rayparam << std::endl;
+std::cout << "constraintempo" << constraintempo << std::endl;
 // make rayleigh weighting curve
 d_vec_t wv(wv_len);
-for (unsigned int i=0; i<wv.size(); i++)
-{
+// check whether or not to use rayleigh weighting (if constraintempo is false)
-wv[i] = (static_cast<double> (i) / pow(rayparam,2.)) * exp((-1.*pow(-static_cast<double> (i),2.)) / (2.*pow(rayparam,2.)));
+// or use gaussian weighting (if constraintempo is true)
+if (constraintempo)
+{
+for (unsigned int i=0; i<wv.size(); i++)
+{
+// MEPD 28/11/12
+// do a gaussian weighting instead of rayleigh
+wv[i] = exp( (-1.*pow((static_cast<double> (i)-rayparam),2.)) / (2.*pow(rayparam/4.,2.)) );
+}
+}
+else
+{
+for (unsigned int i=0; i<wv.size(); i++)
+{
+// MEPD 28/11/12
+// standard rayleigh weighting over periodicities
+wv[i] = (static_cast<double> (i) / pow(rayparam,2.)) * exp((-1.*pow(-static_cast<double> (i),2.)) / (2.*pow(rayparam,2.)));
+}
 }
 // beat tracking frame size (roughly 6 seconds) and hop (1.5 seconds)
 unsigned int winlen = 512;
 unsigned int step = 128;
 for (unsigned int k=0; k<winlen; k++)
 {
 dfframe[k] = df[i+k];
 }
 // get rcf vector for current frame
 d_vec_t rcf(wv_len);
 get_rcf(dfframe,wv,rcf);
 rcfmat.push_back( d_vec_t() ); // adds a new column
 col_counter++;
 for (unsigned int j=0; j<rcf.size(); j++)
 {
 rcfmat[col_counter].push_back( rcf[j] );
 }
 }
 // now call viterbi decoding function
 viterbi_decode(rcfmat,wv,beat_period,tempi);
 }
 MathUtilities::adaptiveThreshold(dfframe);
 d_vec_t acf(dfframe.size());
 for (unsigned int lag=0; lag<dfframe.size(); lag++)
 {
 double sum = 0.;
 double tmp = 0.;
 for (unsigned int n=0; n<(dfframe.size()-lag); n++)
 {
 tmp = dfframe[n] * dfframe[n+lag];
 sum += tmp;
 }
 acf[lag] = static_cast<double> (sum/ (dfframe.size()-lag));
 }
 // now apply comb filtering
 int numelem = 4;
 for (unsigned int i = 2;i < rcf.size();i++) // max beat period
 {
 for (int a = 1;a <= numelem;a++) // number of comb elements
 {
 for (int b = 1-a;b <= a-1;b++) // general state using normalisation of comb elements
 {
 rcf[i-1] += ( acf[(a*i+b)-1]*wv[i-1] ) / (2.*a-1.);	// calculate value for comb filter row
 }
 }
 }
 // apply adaptive threshold to rcf
 MathUtilities::adaptiveThreshold(rcf);
 double rcfsum =0.;
 for (unsigned int i=0; i<rcf.size(); i++)
 {
 rcf[i] += EPS ;
 rcfsum += rcf[i];
 d_mat_t tmat;
 for (unsigned int i=0;i<wv.size();i++)
 {
 tmat.push_back ( d_vec_t() ); // adds a new column
 for (unsigned int j=0; j<wv.size(); j++)
 {
 tmat[i].push_back(0.); // fill with zeros initially
 }
 }
 // variance of Gaussians in transition matrix
 // formed of Gaussians on diagonal - implies slow tempo change
 double sigma = 8.;
 // don't want really short beat periods, or really long ones
 for (unsigned int i=20;i <wv.size()-20; i++)
 {
 for (unsigned int j=20; j<wv.size()-20; j++)
 {
 double mu = static_cast<double>(i);
 tmat[i][j] = exp( (-1.*pow((j-mu),2.)) / (2.*pow(sigma,2.)) );
 }
 }
 for (unsigned int i=0;i <rcfmat.size(); i++)
 {
 delta.push_back( d_vec_t());
 psi.push_back( i_vec_t());
 for (unsigned int j=0; j<rcfmat[i].size(); j++)
 {
 delta[i].push_back(0.); // fill with zeros initially
 psi[i].push_back(0); // fill with zeros initially
 }
 }
 for (unsigned int j=0; j<Q; j++)
 {
 delta[0][j] = wv[j] * rcfmat[0][j];
 psi[0][j] = 0;
 }
 double deltasum = 0.;
 for (unsigned int i=0; i<Q; i++)
 {
 deltasum += delta[0][i];
 }
 for (unsigned int i=0; i<Q; i++)
 {
 delta[0][i] /= (deltasum + EPS);
 }
 for (unsigned int t=1; t<T; t++)
 {
 d_vec_t tmp_vec(Q);
 for (unsigned int j=0; j<Q; j++)
 {
 for (unsigned int i=0; i<Q; i++)
 {
 tmp_vec[i] = delta[t-1][i] * tmat[j][i];
 }
 delta[t][j] = get_max_val(tmp_vec);
 psi[t][j] = get_max_ind(tmp_vec);
 delta[t][j] *= rcfmat[t][j];
 }
 // normalise current delta column
 double deltasum = 0.;
 for (unsigned int i=0; i<Q; i++)
 {
 deltasum += delta[t][i];
 }
 for (unsigned int i=0; i<Q; i++)
 {
 delta[t][i] /= (deltasum + EPS);
 }
 }
 i_vec_t bestpath(T);
 d_vec_t tmp_vec(Q);
 for (unsigned int i=0; i<Q; i++)
 {
 tmp_vec[i] = delta[T-1][i];
 }
 // find starting point - best beat period for "last" frame
 bestpath[T-1] = get_max_ind(tmp_vec);
 // backtrace through index of maximum values in psi
 for (unsigned int t=T-2; t>0 ;t--)
 {
 bestpath[t] = psi[t+1][bestpath[t+1]];
 }
 // weird but necessary hack -- couldn't get above loop to terminate at t >= 0
 bestpath[0] = psi[1][bestpath[1]];
 unsigned int lastind = 0;
 for (unsigned int i=0; i<T; i++)
 {
 unsigned int step = 128;
 for (unsigned int j=0; j<step; j++)
 {
 lastind = i*step+j;
 beat_period[lastind] = bestpath[i];
 if (maxval < df[i])
 {
 maxval = df[i];
 }
 }
 return maxval;
 }
 int
 TempoTrackV2::get_max_ind(const d_vec_t &df)
 {
 maxval = df[i];
 ind = i;
 }
 }
 return ind;
 }
 void
 TempoTrackV2::normalise_vec(d_vec_t &df)
 double sum = 0.;
 for (unsigned int i=0; i<df.size(); i++)
 {
 sum += df[i];
 }
 for (unsigned int i=0; i<df.size(); i++)
 {
 df[i]/= (sum + EPS);
 }
 }
+// MEPD 28/11/12
+// this function has been updated to allow the "alpha" and "tightness" parameters
+// of the dynamic program to be set by the user
+// the default value of alpha = 0.9 and tightness = 4
 void
 TempoTrackV2::calculateBeats(const vector<double> &df,
 const vector<double> &beat_period,
-vector<double> &beats)
+vector<double> &beats, double alpha, double tightness)
 {
 if (df.empty() || beat_period.empty()) return;
 d_vec_t cumscore(df.size()); // store cumulative score
 i_vec_t backlink(df.size()); // backlink (stores best beat locations at each time instant)
 {
 localscore[i] = df[i];
 backlink[i] = -1;
 }
-double tightness = 4.;
+//double tightness = 4.;
-double alpha = 0.9;
+//double alpha = 0.9;
+// MEPD 28/11/12
+// debug statements that can be removed.
+std::cout << "alpha" << alpha << std::endl;
+std::cout << "tightness" << tightness << std::endl;
 // main loop
 for (unsigned int i=0; i<localscore.size(); i++)
 {
 int prange_min = -2*beat_period[i];
 // IF IN THE ALLOWED RANGE, THEN LOOK AT CUMSCORE[I+PRANGE_MIN+J
 // ELSE LEAVE AT DEFAULT VALUE FROM INITIALISATION:  D_VEC_T SCORECANDS (TXWT.SIZE());
 int cscore_ind = i+prange_min+j;
 if (cscore_ind >= 0)
 {
 scorecands[j] = txwt[j] * cumscore[cscore_ind];
 }
 }
 // STARTING POINT, I.E. LAST BEAT.. PICK A STRONG POINT IN cumscore VECTOR
 d_vec_t tmp_vec;
 for (unsigned int i=cumscore.size() - beat_period[beat_period.size()-1] ; i<cumscore.size(); i++)
 {
 tmp_vec.push_back(cumscore[i]);
 }
 int startpoint = get_max_ind(tmp_vec) + cumscore.size() - beat_period[beat_period.size()-1] ;
 // can happen if no results obtained earlier (e.g. input too short)
 if (startpoint >= backlink.size()) startpoint = backlink.size()-1;
 //        std::cerr << "backlink[" << ibeats.back() << "] = " << backlink[ibeats.back()] << std::endl;
 int b = ibeats.back();
 if (backlink[b] == b) break; // shouldn't happen... haha
 ibeats.push_back(backlink[b]);
 }
 // REVERSE SEQUENCE OF IBEATS AND STORE AS BEATS
 for (unsigned int i=0; i<ibeats.size(); i++)
 {
 beats.push_back( static_cast<double>(ibeats[ibeats.size()-i-1]) );
 }
 }

Mercurial > hg > qm-dsp

comparison dsp/tempotracking/TempoTrackV2.cpp @ 100:d7619173d43c mepd_new_params