annotate dsp/segmentation/ClusterMeltSegmenter.h @ 249:18a0dffa5c1a

* Various fixes to segmentation code
author Chris Cannam <c.cannam@qmul.ac.uk>
date Thu, 10 Jan 2008 15:14:53 +0000
parents cdfd0948a852
children d096a79fa772
rev   line source
c@249 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
c@249 2
c@243 3 /*
c@249 4 * ClusterMeltSegmenter.h
c@243 5 *
c@249 6 * Created by Mark Levy on 23/03/2006.
c@249 7 * Copyright 2006 Centre for Digital Music, Queen Mary, University of London.
c@249 8 * All rights reserved.
c@243 9 */
c@243 10
c@243 11 #include <vector>
c@243 12
c@243 13 #include "segment.h"
c@243 14 #include "Segmenter.h"
c@245 15 #include "hmm/hmm.h"
c@245 16 #include "base/Window.h"
c@243 17
c@243 18 using std::vector;
c@243 19
c@249 20 class Decimator;
c@249 21 class ConstantQ;
c@249 22
c@249 23 class ClusterMeltSegmenterParams // configuration bundle taken by ClusterMeltSegmenter's constructor
c@249 24 // defaults are sensible for 11025Hz with 0.2 second hopsize
c@243 25 {
c@243 26 public:
c@249 27 ClusterMeltSegmenterParams() : // default constructor: initialises every field to the values below
c@249 28 featureType(FEATURE_TYPE_CONSTQ), // enumerator declared outside this file
c@249 29 hopSize(0.2), // seconds
c@249 30 windowSize(0.6), // seconds
c@249 31 fmin(62), // presumably Hz - TODO confirm
c@249 32 fmax(16000), // presumably Hz - NOTE(review): if so, this exceeds Nyquist for the 11025Hz rate mentioned above; confirm
c@249 33 nbins(8),
c@249 34 ncomponents(20),
c@249 35 nHMMStates(40),
c@249 36 nclusters(10),
c@249 37 histogramLength(15),
c@249 38 neighbourhoodLimit(20) { }
c@249 39 feature_types featureType; // feature_types is declared outside this file (presumably segment.h - confirm)
c@249 40 double hopSize; // in secs
c@249 41 double windowSize; // in secs
c@249 42 int fmin; // constant-Q parameter (grouped as such in ClusterMeltSegmenter); units not stated here
c@249 43 int fmax; // constant-Q parameter; units not stated here
c@249 44 int nbins; // constant-Q parameter
c@249 45 int ncomponents; // PCA parameter
c@249 46 int nHMMStates; // HMM parameter
c@249 47 int nclusters; // clustering parameter
c@249 48 int histogramLength; // clustering parameter
c@249 49 int neighbourhoodLimit; // clustering parameter
c@243 50 };
c@243 51
c@243 52 class ClusterMeltSegmenter : public Segmenter // Segmenter subclass holding an HMM, its decoded state sequence and histograms
c@243 53 {
c@243 54 public:
c@249 55 ClusterMeltSegmenter(ClusterMeltSegmenterParams params); // params taken by value; NOTE(review): not explicit, so implicit conversion from params is allowed
c@249 56 virtual ~ClusterMeltSegmenter();
c@249 57 virtual void initialise(int samplerate); // samplerate presumably in Hz - TODO confirm
c@249 58 virtual int getWindowsize(); // NOTE(review): units not visible here (windowSize member is in seconds) - confirm in the .cpp
c@249 59 virtual int getHopsize(); // NOTE(review): units not visible here (hopSize member is in seconds) - confirm in the .cpp
c@249 60 virtual void extractFeatures(const double* samples, int nsamples); // nsamples presumably the element count of samples - TODO confirm
c@249 61 void setFeatures(const vector<vector<double> >& f); // provide the features yourself
c@249 62 virtual void segment(); // segment into default number of segment-types
c@249 63 void segment(int m); // segment into m segment-types
c@249 64 int getNSegmentTypes() { return nclusters; } // returns the nclusters member
c@249 65
c@243 66 protected:
c@249 67 void makeSegmentation(int* q, int len); // NOTE(review): parameter q shadows the member q below; len presumably the length of q - confirm
c@243 68
c@249 69 Window<double> *window; // raw pointer; ownership/lifetime not visible in this header
c@249 70 ConstantQ* constq; // ConstantQ is only forward-declared in this header; ownership not visible here
c@249 71 model_t* model; // the HMM
c@249 72 int* q; // the decoded HMM state sequence
c@249 73 vector<vector<double> > histograms;
c@249 74
c@249 75 feature_types featureType; // same name and type as the ClusterMeltSegmenterParams field
c@249 76 double hopSize; // in seconds
c@249 77 double windowSize; // in seconds
c@249 78
c@249 79 // constant-Q parameters
c@249 80 int fmin;
c@249 81 int fmax;
c@249 82 int nbins;
c@249 83 int ncoeff; // NOTE(review): has no counterpart in ClusterMeltSegmenterParams; presumably derived in the .cpp - confirm
c@249 84
c@249 85 // PCA parameters
c@249 86 int ncomponents;
c@249 87
c@249 88 // HMM parameters
c@249 89 int nHMMStates;
c@249 90
c@249 91 // clustering parameters
c@249 92 int nclusters;
c@249 93 int histogramLength;
c@249 94 int neighbourhoodLimit;
c@249 95
c@249 96 Decimator *decimator; // Decimator is only forward-declared in this header; ownership not visible here
c@243 97 };