annotate src/Silvet.h @ 343:460cabb27bf7

Make the onset/offset output consistent with the notes output in terms of restarting notes when a shift changes
author Chris Cannam
date Wed, 12 Aug 2015 14:50:30 +0100
parents 705d807ca2ca
children a3fc6e1f2d4e
rev   line source
Chris@31 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
Chris@31 2
Chris@31 3 /*
Chris@31 4 Silvet
Chris@31 5
Chris@31 6 A Vamp plugin for note transcription.
Chris@31 7 Centre for Digital Music, Queen Mary University of London.
Chris@31 8
Chris@31 9 This program is free software; you can redistribute it and/or
Chris@31 10 modify it under the terms of the GNU General Public License as
Chris@31 11 published by the Free Software Foundation; either version 2 of the
Chris@31 12 License, or (at your option) any later version. See the file
Chris@31 13 COPYING included with this distribution for more information.
Chris@31 14 */
Chris@31 15
Chris@31 16 #ifndef SILVET_H
Chris@31 17 #define SILVET_H
Chris@31 18
Chris@31 19 #include <vamp-sdk/Plugin.h>
Chris@31 20
Chris@32 21 #include <vector>
Chris@32 22 #include <string>
Chris@41 23 #include <set>
Chris@32 24
Chris@152 25 #include "MedianFilter.h"
Chris@161 26 #include "Instruments.h"
Chris@32 27
Chris@31 28 using std::string;
Chris@32 29 using std::vector;
Chris@41 30 using std::set;
Chris@55 31 using std::map;
Chris@31 32
Chris@31 33 class Resampler;
Chris@145 34 class CQSpectrogram;
Chris@246 35 class FlattenDynamics;
Chris@31 36
// Silvet: a Vamp plugin for note transcription (see the header comment
// at the top of this file). The class derives from Vamp::Plugin; the
// public member functions below are presumably the implementations of
// that plugin interface -- the base class is not visible in this file,
// so confirm against the Vamp SDK before changing any signature.
//
// Only getPack() is defined inline; everything else is declared here
// and defined elsewhere.
Chris@31 37 class Silvet : public Vamp::Plugin
Chris@31 38 {
Chris@31 39 public:
Chris@31 40 Silvet(float inputSampleRate);
Chris@31 41 virtual ~Silvet();
Chris@31 42
// Plugin identification and descriptive strings.
Chris@31 43 string getIdentifier() const;
Chris@31 44 string getName() const;
Chris@31 45 string getDescription() const;
Chris@31 46 string getMaker() const;
Chris@31 47 int getPluginVersion() const;
Chris@31 48 string getCopyright() const;
Chris@31 49
// Input requirements: domain, block/step sizes and channel counts.
Chris@31 50 InputDomain getInputDomain() const;
Chris@31 51 size_t getPreferredBlockSize() const;
Chris@31 52 size_t getPreferredStepSize() const;
Chris@31 53 size_t getMinChannelCount() const;
Chris@31 54 size_t getMaxChannelCount() const;
Chris@31 55
// Parameters are addressed by string identifier and carried as float.
Chris@31 56 ParameterList getParameterDescriptors() const;
Chris@31 57 float getParameter(string identifier) const;
Chris@31 58 void setParameter(string identifier, float value);
Chris@31 59
Chris@31 60 ProgramList getPrograms() const;
Chris@31 61 string getCurrentProgram() const;
Chris@31 62 void selectProgram(string name);
Chris@31 63
Chris@31 64 OutputList getOutputDescriptors() const;
Chris@31 65
Chris@31 66 bool initialise(size_t channels, size_t stepSize, size_t blockSize);
Chris@31 67 void reset();
Chris@31 68
// Takes one block of input per call and returns a FeatureSet.
Chris@31 69 FeatureSet process(const float *const *inputBuffers,
Chris@31 70 Vamp::RealTime timestamp);
Chris@31 71
Chris@31 72 FeatureSet getRemainingFeatures();
Chris@31 73
// Processing mode. The enumerators have explicit values (0 and 1);
// presumably these match the numeric value of a plugin parameter --
// TODO confirm in the implementation. The mode decides which
// instrument pack list getPack() reads from.
Chris@341 74 enum ProcessingMode {
Chris@341 75 LiveMode = 0,
Chris@316 76 HighQualityMode = 1,
Chris@316 77 };
Chris@316 78
Chris@31 79 protected:
// Two parallel lists of instrument packs, both const for the lifetime
// of the object: m_liveInstruments is used in LiveMode, m_instruments
// in any other mode (see getPack()).
Chris@161 80 const std::vector<InstrumentPack> m_instruments;
Chris@298 81 const std::vector<InstrumentPack> m_liveInstruments;
Chris@161 82
// Returns a reference to the instrument pack at index `instrument`
// from the list that corresponds to the current m_mode.
// The index is applied with operator[] and is not range-checked, so
// the caller must pass a valid index for the selected list.
Chris@298 83 const InstrumentPack &getPack(int instrument) const {
Chris@298 84 if (m_mode == LiveMode) {
Chris@298 85 return m_liveInstruments[instrument];
Chris@298 86 } else {
Chris@298 87 return m_instruments[instrument];
Chris@298 88 }
Chris@298 89 }
Chris@298 90
// Raw pointers to types that are only forward-declared in this header.
// NOTE(review): ownership and lifetime are not visible here; presumably
// the plugin allocates and frees them itself -- confirm in the
// implementation file.
Chris@31 91 Resampler *m_resampler;
Chris@246 92 FlattenDynamics *m_flattener;
Chris@145 93 CQSpectrogram *m_cq;
Chris@32 94
Chris@297 95 ProcessingMode m_mode;
Chris@297 96
Chris@166 97 bool m_fineTuning;
// Index passed to getPack() is presumably this value -- TODO confirm.
Chris@162 98 int m_instrument;
Chris@165 99 int m_colsPerSec;
Chris@110 100
// A Grid is a vector of columns, each column a vector of doubles.
Chris@32 101 typedef vector<vector<double> > Grid;
Chris@32 102
// NOTE(review): std::map and std::pair are used in this class, but this
// header visibly includes only <vector>, <string> and <set>. Presumably
// <map> and <utility> arrive transitively via MedianFilter.h or
// Instruments.h -- confirm, or include them directly.
Chris@41 103 vector<MedianFilter<double> *> m_postFilter;
// Presumably one map per processed column; the key and value meanings
// (likely note -> strength and note -> shift) are not shown here --
// TODO confirm.
Chris@55 104 vector<map<int, double> > m_pianoRoll;
Chris@168 105 vector<map<int, int> > m_pianoRollShifts;
// Gain values keyed by timestamp; see getInputGainAt().
Chris@252 106 map<Vamp::RealTime, float> m_inputGains;
Chris@325 107 set<int> m_current;
Chris@41 108
Chris@32 109 Grid preProcess(const Grid &);
Chris@166 110
// Takes an instrument pack and one column of doubles; returns a pair
// of (vector<double>, vector<int>). These have the same types as the
// `pitches` and `bestShifts` arguments of postProcess() below, so
// presumably that is what the pair carries -- TODO confirm.
Chris@311 111 std::pair<vector<double>, vector<int> > applyEM(const InstrumentPack &pack,
Chris@336 112 const vector<double> &column);
Chris@311 113
Chris@321 114 void postProcess(const vector<double> &pitches,
Chris@336 115 const vector<int> &bestShifts); // -> piano roll column
Chris@166 116
// Bundle of three feature lists, used as the return type of
// noteTrack().
Chris@336 117 struct FeatureChunk {
Chris@336 118 FeatureList notes;
Chris@336 119 FeatureList onsets;
Chris@336 120 FeatureList onOffsets;
Chris@336 121 };
Chris@166 122
Chris@336 123 int getShiftCount() const;
Chris@336 124
Chris@336 125 FeatureChunk noteTrack(); // notes, on/offsets
Chris@336 126
// The emit* helpers append to the feature lists passed by reference.
// `start` and `end` are ints; presumably column indices, as in
// getColumnTimestamp() -- TODO confirm.
Chris@343 127 void emitNoteAndOffset(int start, int end, int note,
Chris@343 128 FeatureList &noteFeatures,
Chris@343 129 FeatureList &onOffsetFeatures);
Chris@319 130
Chris@336 131 void emitOnset(int start, int note,
Chris@336 132 FeatureList &onOffsetFeatures);
Chris@336 133
// Maps an integer column index to a Vamp::RealTime.
Chris@309 134 Vamp::RealTime getColumnTimestamp(int column);
Chris@309 135
// Builders for the individual Feature values; each returns by value.
Chris@336 136 Feature makeNoteFeature(int start, int end, int note, int shift, double strength);
Chris@336 137 Feature makeOnsetFeature(int start, int note, int shift, double strength);
Chris@336 138 Feature makeOffsetFeature(int col, int note, int shift);
Chris@252 139
Chris@320 140 int getVelocityFor(double strength, int column);
Chris@320 141
Chris@252 142 float getInputGainAt(Vamp::RealTime t);
Chris@252 143
// Both take the FeatureSet by non-const reference, so results are
// written into the caller's set rather than returned.
Chris@302 144 void insertTemplateFeatures(FeatureSet &);
Chris@302 145
Chris@302 146 void transcribe(const Grid &, FeatureSet &);
Chris@31 147
Chris@320 148 string getChromaName(int n) const;
Chris@336 149 string getNoteName(int n, int shift) const;
Chris@336 150 float getNoteFrequency(int n, int shift) const;
Chris@38 151
Chris@31 152 int m_blockSize;
Chris@32 153 int m_columnCount;
Chris@272 154 int m_resampledCount;
Chris@40 155 Vamp::RealTime m_startTime;
Chris@313 156 bool m_haveStartTime;
Chris@32 157
// Output numbers, one per plugin output. They are `mutable` so that
// const member functions can assign them (presumably
// getOutputDescriptors() -- TODO confirm).
Chris@32 158 mutable int m_notesOutputNo;
Chris@319 159 mutable int m_onsetsOutputNo;
Chris@336 160 mutable int m_onOffsetsOutputNo;
Chris@178 161 mutable int m_fcqOutputNo;
Chris@294 162 mutable int m_pitchOutputNo;
Chris@302 163 mutable int m_templateOutputNo;
Chris@309 164 mutable int m_chromaOutputNo;
Chris@31 165 };
Chris@31 166
Chris@31 167 #endif