annotate src/Silvet.h @ 372:af71cbdab621 tip

Update bqvec code
author Chris Cannam
date Tue, 19 Nov 2019 10:13:32 +0000
parents a3fc6e1f2d4e
children
rev   line source
Chris@31 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@31 2
Chris@31 3 /*
Chris@31 4 Silvet
Chris@31 5
Chris@31 6 A Vamp plugin for note transcription.
Chris@31 7 Centre for Digital Music, Queen Mary University of London.
Chris@31 8
Chris@31 9 This program is free software; you can redistribute it and/or
Chris@31 10 modify it under the terms of the GNU General Public License as
Chris@31 11 published by the Free Software Foundation; either version 2 of the
Chris@31 12 License, or (at your option) any later version. See the file
Chris@31 13 COPYING included with this distribution for more information.
Chris@31 14 */
Chris@31 15
Chris@31 16 #ifndef SILVET_H
Chris@31 17 #define SILVET_H
Chris@31 18
Chris@31 19 #include <vamp-sdk/Plugin.h>
Chris@31 20
Chris@32 21 #include <vector>
Chris@32 22 #include <string>
Chris@41 23 #include <set>
Chris@32 24
Chris@152 25 #include "MedianFilter.h"
Chris@161 26 #include "Instruments.h"
Chris@32 27
// Default value for MAX_EM_THREADS. The guard means a definition supplied
// earlier (for example on the compiler command line) takes precedence over
// this default. NOTE(review): presumably an upper bound on worker threads
// for the EM step; the macro is not used within this header, so confirm
// against the implementation file.
#if !defined(MAX_EM_THREADS)
#  define MAX_EM_THREADS 8
#endif
Chris@352 31
Chris@31 32 using std::string;
Chris@32 33 using std::vector;
Chris@41 34 using std::set;
Chris@55 35 using std::map;
Chris@31 36
Chris@31 37 class Resampler;
Chris@145 38 class CQSpectrogram;
Chris@246 39 class FlattenDynamics;
Chris@31 40
Chris@31 41 class Silvet : public Vamp::Plugin
Chris@31 42 {
Chris@31 43 public:
Chris@31 44 Silvet(float inputSampleRate);
Chris@31 45 virtual ~Silvet();
Chris@31 46
Chris@31 47 string getIdentifier() const;
Chris@31 48 string getName() const;
Chris@31 49 string getDescription() const;
Chris@31 50 string getMaker() const;
Chris@31 51 int getPluginVersion() const;
Chris@31 52 string getCopyright() const;
Chris@31 53
Chris@31 54 InputDomain getInputDomain() const;
Chris@31 55 size_t getPreferredBlockSize() const;
Chris@31 56 size_t getPreferredStepSize() const;
Chris@31 57 size_t getMinChannelCount() const;
Chris@31 58 size_t getMaxChannelCount() const;
Chris@31 59
Chris@31 60 ParameterList getParameterDescriptors() const;
Chris@31 61 float getParameter(string identifier) const;
Chris@31 62 void setParameter(string identifier, float value);
Chris@31 63
Chris@31 64 ProgramList getPrograms() const;
Chris@31 65 string getCurrentProgram() const;
Chris@31 66 void selectProgram(string name);
Chris@31 67
Chris@31 68 OutputList getOutputDescriptors() const;
Chris@31 69
Chris@31 70 bool initialise(size_t channels, size_t stepSize, size_t blockSize);
Chris@31 71 void reset();
Chris@31 72
Chris@31 73 FeatureSet process(const float *const *inputBuffers,
Chris@31 74 Vamp::RealTime timestamp);
Chris@31 75
Chris@31 76 FeatureSet getRemainingFeatures();
Chris@31 77
Chris@341 78 enum ProcessingMode {
Chris@341 79 LiveMode = 0,
Chris@316 80 HighQualityMode = 1,
Chris@316 81 };
Chris@316 82
Chris@31 83 protected:
Chris@161 84 const std::vector<InstrumentPack> m_instruments;
Chris@298 85 const std::vector<InstrumentPack> m_liveInstruments;
Chris@161 86
Chris@298 87 const InstrumentPack &getPack(int instrument) const {
Chris@298 88 if (m_mode == LiveMode) {
Chris@298 89 return m_liveInstruments[instrument];
Chris@298 90 } else {
Chris@298 91 return m_instruments[instrument];
Chris@298 92 }
Chris@298 93 }
Chris@298 94
Chris@31 95 Resampler *m_resampler;
Chris@246 96 FlattenDynamics *m_flattener;
Chris@145 97 CQSpectrogram *m_cq;
Chris@32 98
Chris@297 99 ProcessingMode m_mode;
Chris@297 100
Chris@166 101 bool m_fineTuning;
Chris@162 102 int m_instrument;
Chris@165 103 int m_colsPerSec;
Chris@110 104
Chris@32 105 typedef vector<vector<double> > Grid;
Chris@32 106
Chris@41 107 vector<MedianFilter<double> *> m_postFilter;
Chris@55 108 vector<map<int, double> > m_pianoRoll;
Chris@168 109 vector<map<int, int> > m_pianoRollShifts;
Chris@252 110 map<Vamp::RealTime, float> m_inputGains;
Chris@325 111 set<int> m_current;
Chris@41 112
Chris@32 113 Grid preProcess(const Grid &);
Chris@166 114
Chris@311 115 std::pair<vector<double>, vector<int> > applyEM(const InstrumentPack &pack,
Chris@336 116 const vector<double> &column);
Chris@311 117
Chris@321 118 void postProcess(const vector<double> &pitches,
Chris@336 119 const vector<int> &bestShifts); // -> piano roll column
Chris@166 120
Chris@336 121 struct FeatureChunk {
Chris@336 122 FeatureList notes;
Chris@336 123 FeatureList onsets;
Chris@336 124 FeatureList onOffsets;
Chris@336 125 };
Chris@166 126
Chris@336 127 int getShiftCount() const;
Chris@336 128
Chris@336 129 FeatureChunk noteTrack(); // notes, on/offsets
Chris@336 130
Chris@343 131 void emitNoteAndOffset(int start, int end, int note,
Chris@343 132 FeatureList &noteFeatures,
Chris@343 133 FeatureList &onOffsetFeatures);
Chris@319 134
Chris@336 135 void emitOnset(int start, int note,
Chris@336 136 FeatureList &onOffsetFeatures);
Chris@336 137
Chris@309 138 Vamp::RealTime getColumnTimestamp(int column);
Chris@309 139
Chris@336 140 Feature makeNoteFeature(int start, int end, int note, int shift, double strength);
Chris@336 141 Feature makeOnsetFeature(int start, int note, int shift, double strength);
Chris@336 142 Feature makeOffsetFeature(int col, int note, int shift);
Chris@252 143
Chris@320 144 int getVelocityFor(double strength, int column);
Chris@320 145
Chris@252 146 float getInputGainAt(Vamp::RealTime t);
Chris@252 147
Chris@302 148 void insertTemplateFeatures(FeatureSet &);
Chris@302 149
Chris@302 150 void transcribe(const Grid &, FeatureSet &);
Chris@31 151
Chris@320 152 string getChromaName(int n) const;
Chris@336 153 string getNoteName(int n, int shift) const;
Chris@336 154 float getNoteFrequency(int n, int shift) const;
Chris@38 155
Chris@31 156 int m_blockSize;
Chris@32 157 int m_columnCount;
Chris@272 158 int m_resampledCount;
Chris@40 159 Vamp::RealTime m_startTime;
Chris@313 160 bool m_haveStartTime;
Chris@32 161
Chris@32 162 mutable int m_notesOutputNo;
Chris@319 163 mutable int m_onsetsOutputNo;
Chris@336 164 mutable int m_onOffsetsOutputNo;
Chris@178 165 mutable int m_fcqOutputNo;
Chris@294 166 mutable int m_pitchOutputNo;
Chris@302 167 mutable int m_templateOutputNo;
Chris@309 168 mutable int m_chromaOutputNo;
Chris@31 169 };
Chris@31 170
Chris@31 171 #endif