view src/Silvet.h @ 325:4cf4313d7e30 livemode

Always use q=0.8 and accept the hit on speed -- the templates are made for that configuration and it does work better. Also some adjustments to thresholding and peak picking for live mode in particular.
author Chris Cannam
date Mon, 18 May 2015 13:58:27 +0100
parents 213a51e197c8
children d25e4aee73d7
line wrap: on
line source
/* -*- c-basic-offset: 4 indent-tabs-mode: nil -*-  vi:set ts=8 sts=4 sw=4: */

/*
  Silvet

  A Vamp plugin for note transcription.
  Centre for Digital Music, Queen Mary University of London.
    
  This program is free software; you can redistribute it and/or
  modify it under the terms of the GNU General Public License as
  published by the Free Software Foundation; either version 2 of the
  License, or (at your option) any later version.  See the file
  COPYING included with this distribution for more information.
*/

#ifndef SILVET_H
#define SILVET_H

#include <vamp-sdk/Plugin.h>

#include <vector>
#include <string>
#include <set>

#include "MedianFilter.h"
#include "Instruments.h"

using std::string;
using std::vector;
using std::set;
using std::map;

class Resampler;
class CQSpectrogram;
class FlattenDynamics;

class Silvet : public Vamp::Plugin
{
public:
    Silvet(float inputSampleRate);
    virtual ~Silvet();

    string getIdentifier() const;
    string getName() const;
    string getDescription() const;
    string getMaker() const;
    int getPluginVersion() const;
    string getCopyright() const;

    InputDomain getInputDomain() const;
    size_t getPreferredBlockSize() const;
    size_t getPreferredStepSize() const;
    size_t getMinChannelCount() const;
    size_t getMaxChannelCount() const;

    ParameterList getParameterDescriptors() const;
    float getParameter(string identifier) const;
    void setParameter(string identifier, float value);

    ProgramList getPrograms() const;
    string getCurrentProgram() const;
    void selectProgram(string name);

    OutputList getOutputDescriptors() const;

    bool initialise(size_t channels, size_t stepSize, size_t blockSize);
    void reset();

    FeatureSet process(const float *const *inputBuffers,
                       Vamp::RealTime timestamp);

    FeatureSet getRemainingFeatures();

    enum ProcessingMode { // ordered so draft==0 and hq==1 as in prior releases
        DraftMode = 0,
        HighQualityMode = 1,
        LiveMode = 2,
    };

protected:
    const std::vector<InstrumentPack> m_instruments;
    const std::vector<InstrumentPack> m_liveInstruments;

    const InstrumentPack &getPack(int instrument) const {
        if (m_mode == LiveMode) {
            return m_liveInstruments[instrument];
        } else {
            return m_instruments[instrument];
        }
    }
    
    Resampler *m_resampler;
    FlattenDynamics *m_flattener;
    CQSpectrogram *m_cq;

    ProcessingMode m_mode;
    
    bool m_fineTuning;
    int m_instrument;
    int m_colsPerSec;

    typedef vector<vector<double> > Grid;

    vector<MedianFilter<double> *> m_postFilter;
    vector<map<int, double> > m_pianoRoll;
    vector<map<int, int> > m_pianoRollShifts;
    map<Vamp::RealTime, float> m_inputGains;
    set<int> m_current;

    Grid preProcess(const Grid &);

    std::pair<vector<double>, vector<int> > applyEM(const InstrumentPack &pack,
                                                    const vector<double> &column,
                                                    bool wantShifts);
    
    void postProcess(const vector<double> &pitches,
                     const vector<int> &bestShifts,
                     bool wantShifts); // -> piano roll column

    std::pair<FeatureList, FeatureList> noteTrack(int shiftCount); // notes, onsets

    void emitNote(int start, int end, int note, int shiftCount,
                  FeatureList &noteFeatures);

    void emitOnset(int start, int note, int shiftCount,
                  FeatureList &noteFeatures);
    
    Vamp::RealTime getColumnTimestamp(int column);
    
    Feature makeNoteFeature(int start, int end, int note, int shift,
                            int shiftCount, double strength);
    Feature makeOnsetFeature(int start, int note, int shift,
                             int shiftCount, double strength);

    int getVelocityFor(double strength, int column);
    
    float getInputGainAt(Vamp::RealTime t);

    void insertTemplateFeatures(FeatureSet &);
    
    void transcribe(const Grid &, FeatureSet &);

    string getChromaName(int n) const;
    string getNoteName(int n, int shift, int shiftCount) const;
    float getNoteFrequency(int n, int shift, int shiftCount) const;

    int m_blockSize;
    int m_columnCount;
    int m_resampledCount;
    Vamp::RealTime m_startTime;
    bool m_haveStartTime;

    mutable int m_notesOutputNo;
    mutable int m_onsetsOutputNo;
    mutable int m_fcqOutputNo;
    mutable int m_pitchOutputNo;
    mutable int m_templateOutputNo;
    mutable int m_chromaOutputNo;
};

#endif