silvet: src/Silvet.cpp comparison

comparison src/Silvet.cpp @ 316:f3e10617a60d livemode

Live mode enhancements: Adjust processing parameters (for speed) and peak-pick pitch activations across frequency (to avoid neighbouring-semitone clusters)

author	Chris Cannam
date	Tue, 28 Apr 2015 12:21:40 +0100
parents	f98ba4f47e49
children	92293058368a

comparison

equal deleted inserted replaced

-:dec47312ed40
+:f3e10617a60d
 static int binsPerSemitoneNormal = 5;
 static int minInputSampleRate = 100;
 static int maxInputSampleRate = 192000;
+static const Silvet::ProcessingMode defaultMode = Silvet::HighQualityMode;
 Silvet::Silvet(float inputSampleRate) :
 Plugin(inputSampleRate),
 m_instruments(InstrumentPack::listInstrumentPacks()),
 m_liveInstruments(LiveAdapter::adaptAll(m_instruments)),
 m_resampler(0),
 m_flattener(0),
 m_cq(0),
-m_mode(HighQualityMode),
+m_mode(defaultMode),
 m_fineTuning(false),
 m_instrument(0),
 m_colsPerSec(50),
 m_haveStartTime(false)
 {
 desc.name = "Processing mode";
 desc.unit = "";
 desc.description = "Sets the tradeoff of processing speed against transcription quality. Draft mode is tuned in favour of overall speed; Live mode is tuned in favour of lower latency; while Intensive mode (the default) will almost always produce the best results.";
 desc.minValue = 0;
 desc.maxValue = 2;
-desc.defaultValue = 1;
+desc.defaultValue = int(defaultMode);
 desc.isQuantized = true;
 desc.quantizeStep = 1;
 desc.valueNames.push_back("Draft (faster)");
 desc.valueNames.push_back("Intensive (higher quality)");
 desc.valueNames.push_back("Live (lower latency)");
 CQParameters params(processingSampleRate,
 minFreq,
 maxFreq,
 bpo);
-params.q = 0.95; // MIREX code uses 0.8, but it seems 0.9 or lower
+// For params.q, the MIREX code uses 0.8, but it seems that with
-// drops the FFT size to 512 from 1024 and alters
+// atomHopFactor of 0.3, using q == 0.9 or lower drops the FFT
-// some other processing parameters, making
+// size to 512 from 1024 and alters some other processing
-// everything much, much slower. Could be a flaw
+// parameters, making everything much, much slower. Could be a
-// in the CQ parameter calculations, must check
+// flaw in the CQ parameter calculations, must check. For
-params.atomHopFactor = 0.3;
+// atomHopFactor == 1, q == 0.8 is fine
+params.q = (m_mode == HighQualityMode ? 0.95 : 0.8);
+params.atomHopFactor = (m_mode == HighQualityMode ? 0.3 : 1.0);
 params.threshold = 0.0005;
 params.window = CQParameters::Hann;
 m_cq = new CQSpectrogram(params, CQSpectrogram::InterpolateLinear);
 for (int j = 0; j < pack.templateNoteCount; ++j) {
 m_postFilter[j]->push(pitches[j]);
 filtered.push_back(m_postFilter[j]->get());
 }
+if (m_mode == LiveMode) {
+// In live mode with only a 12-bpo CQ, we are very likely to
+// get clusters of two or three high scores at a time for
+// neighbouring semitones. Eliminate these by picking only the
+// peaks. This means we can't recognise actual semitone chords
+// if they ever appear, but it's not as if live mode is good
+// enough for that to be a big deal anyway.
+for (int j = 0; j < pack.templateNoteCount; ++j) {
+if (j > 0 && j + 1 < pack.templateNoteCount &&
+filtered[j] >= filtered[j-1] &&
+filtered[j] >= filtered[j+1]) {
+} else {
+filtered[j] = 0.0;
+}
+}
+}
 // Threshold for level and reduce number of candidate pitches
 typedef std::multimap<double, int> ValueIndexMap;
 ValueIndexMap strengths;
 }
 }
 int v;
 if (m_mode == LiveMode) {
-v = round(strength * 30);
+v = round(strength * 20);
 } else {
 v = round(strength * 2);
 }
 if (v > partVelocity) {
 partVelocity = v;

Mercurial > hg > silvet

comparison src/Silvet.cpp @ 316:f3e10617a60d livemode