annotate VampYin.cpp @ 81:e6b234575df1 tony

added spurious file VampYin.cpp
author matthiasm
date Wed, 03 Dec 2014 14:49:54 +0000
parents
children
rev   line source
matthiasm@81 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
matthiasm@81 2
matthiasm@81 3 /*
matthiasm@81 4 pYIN - A fundamental frequency estimator for monophonic audio
matthiasm@81 5 Centre for Digital Music, Queen Mary, University of London.
matthiasm@81 6
matthiasm@81 7 This program is free software; you can redistribute it and/or
matthiasm@81 8 modify it under the terms of the GNU General Public License as
matthiasm@81 9 published by the Free Software Foundation; either version 2 of the
matthiasm@81 10 License, or (at your option) any later version. See the file
matthiasm@81 11 COPYING included with this distribution for more information.
matthiasm@81 12 */
matthiasm@81 13
matthiasm@81 14 #include "YinVamp.h"
matthiasm@81 15 #include "MonoNote.h"
matthiasm@81 16
matthiasm@81 17 #include "vamp-sdk/FFT.h"
matthiasm@81 18
matthiasm@81 19 #include <vector>
matthiasm@81 20 #include <algorithm>
matthiasm@81 21
matthiasm@81 22 #include <cstdio>
matthiasm@81 23 #include <cmath>
matthiasm@81 24 #include <complex>
matthiasm@81 25
matthiasm@81 26 using std::string;
matthiasm@81 27 using std::vector;
matthiasm@81 28 using Vamp::RealTime;
matthiasm@81 29
matthiasm@81 30
matthiasm@81 31 YinVamp::YinVamp(float inputSampleRate) :
matthiasm@81 32 Plugin(inputSampleRate),
matthiasm@81 33 m_channels(0),
matthiasm@81 34 m_stepSize(256),
matthiasm@81 35 m_blockSize(2048),
matthiasm@81 36 m_fmin(40),
matthiasm@81 37 m_fmax(1000),
matthiasm@81 38 m_yin(2048, inputSampleRate, 0.0),
matthiasm@81 39 m_outNoF0(0),
matthiasm@81 40 m_outNoPeriodicity(0),
matthiasm@81 41 m_outNoRms(0),
matthiasm@81 42 m_outNoSalience(0),
matthiasm@81 43 m_yinParameter(0.15f),
matthiasm@81 44 m_outputUnvoiced(2.0f)
matthiasm@81 45 {
matthiasm@81 46 }
matthiasm@81 47
matthiasm@81 48 YinVamp::~YinVamp()
matthiasm@81 49 {
matthiasm@81 50 }
matthiasm@81 51
matthiasm@81 52 string
matthiasm@81 53 YinVamp::getIdentifier() const
matthiasm@81 54 {
matthiasm@81 55 return "yin";
matthiasm@81 56 }
matthiasm@81 57
matthiasm@81 58 string
matthiasm@81 59 YinVamp::getName() const
matthiasm@81 60 {
matthiasm@81 61 return "Yin";
matthiasm@81 62 }
matthiasm@81 63
matthiasm@81 64 string
matthiasm@81 65 YinVamp::getDescription() const
matthiasm@81 66 {
matthiasm@81 67 return "A vamp implementation of the Yin algorithm for monophonic frequency estimation.";
matthiasm@81 68 }
matthiasm@81 69
matthiasm@81 70 string
matthiasm@81 71 YinVamp::getMaker() const
matthiasm@81 72 {
matthiasm@81 73 return "Matthias Mauch";
matthiasm@81 74 }
matthiasm@81 75
matthiasm@81 76 int
matthiasm@81 77 YinVamp::getPluginVersion() const
matthiasm@81 78 {
matthiasm@81 79 // Increment this each time you release a version that behaves
matthiasm@81 80 // differently from the previous one
matthiasm@81 81 return 1;
matthiasm@81 82 }
matthiasm@81 83
matthiasm@81 84 string
matthiasm@81 85 YinVamp::getCopyright() const
matthiasm@81 86 {
matthiasm@81 87 return "GPL";
matthiasm@81 88 }
matthiasm@81 89
matthiasm@81 90 YinVamp::InputDomain
matthiasm@81 91 YinVamp::getInputDomain() const
matthiasm@81 92 {
matthiasm@81 93 return TimeDomain;
matthiasm@81 94 }
matthiasm@81 95
matthiasm@81 96 size_t
matthiasm@81 97 YinVamp::getPreferredBlockSize() const
matthiasm@81 98 {
matthiasm@81 99 return 2048;
matthiasm@81 100 }
matthiasm@81 101
matthiasm@81 102 size_t
matthiasm@81 103 YinVamp::getPreferredStepSize() const
matthiasm@81 104 {
matthiasm@81 105 return 256;
matthiasm@81 106 }
matthiasm@81 107
matthiasm@81 108 size_t
matthiasm@81 109 YinVamp::getMinChannelCount() const
matthiasm@81 110 {
matthiasm@81 111 return 1;
matthiasm@81 112 }
matthiasm@81 113
matthiasm@81 114 size_t
matthiasm@81 115 YinVamp::getMaxChannelCount() const
matthiasm@81 116 {
matthiasm@81 117 return 1;
matthiasm@81 118 }
matthiasm@81 119
matthiasm@81 120 YinVamp::ParameterList
matthiasm@81 121 YinVamp::getParameterDescriptors() const
matthiasm@81 122 {
matthiasm@81 123 ParameterList list;
matthiasm@81 124
matthiasm@81 125 ParameterDescriptor d;
matthiasm@81 126 d.identifier = "yinThreshold";
matthiasm@81 127 d.name = "Yin threshold";
matthiasm@81 128 d.description = "The greedy Yin search for a low value difference function is done once a dip lower than this threshold is reached.";
matthiasm@81 129 d.unit = "";
matthiasm@81 130 d.minValue = 0.025f;
matthiasm@81 131 d.maxValue = 1.0f;
matthiasm@81 132 d.defaultValue = 0.15f;
matthiasm@81 133 d.isQuantized = true;
matthiasm@81 134 d.quantizeStep = 0.025f;
matthiasm@81 135
matthiasm@81 136 list.push_back(d);
matthiasm@81 137
matthiasm@81 138 // d.identifier = "removeunvoiced";
matthiasm@81 139 // d.name = "Remove pitches classified as unvoiced.";
matthiasm@81 140 // d.description = "If ticked, then the pitch estimator will return the most likely pitch, even if it 'thinks' there isn't any.";
matthiasm@81 141 // d.unit = "";
matthiasm@81 142 // d.minValue = 0.0f;
matthiasm@81 143 // d.maxValue = 1.0f;
matthiasm@81 144 // d.defaultValue = 0.0f;
matthiasm@81 145 // d.isQuantized = true;
matthiasm@81 146 // d.quantizeStep = 1.0f;
matthiasm@81 147 // d.valueNames.clear();
matthiasm@81 148 // list.push_back(d);
matthiasm@81 149
matthiasm@81 150 d.identifier = "outputunvoiced";
matthiasm@81 151 d.valueNames.clear();
matthiasm@81 152 d.name = "Output estimates classified as unvoiced?";
matthiasm@81 153 d.description = ".";
matthiasm@81 154 d.unit = "";
matthiasm@81 155 d.minValue = 0.0f;
matthiasm@81 156 d.maxValue = 2.0f;
matthiasm@81 157 d.defaultValue = 2.0f;
matthiasm@81 158 d.isQuantized = true;
matthiasm@81 159 d.quantizeStep = 1.0f;
matthiasm@81 160 d.valueNames.push_back("No");
matthiasm@81 161 d.valueNames.push_back("Yes");
matthiasm@81 162 d.valueNames.push_back("Yes, as negative frequencies");
matthiasm@81 163 list.push_back(d);
matthiasm@81 164
matthiasm@81 165 return list;
matthiasm@81 166 }
matthiasm@81 167
matthiasm@81 168 float
matthiasm@81 169 YinVamp::getParameter(string identifier) const
matthiasm@81 170 {
matthiasm@81 171 if (identifier == "yinThreshold") {
matthiasm@81 172 return m_yinParameter;
matthiasm@81 173 }
matthiasm@81 174 if (identifier == "outputunvoiced") {
matthiasm@81 175 return m_outputUnvoiced;
matthiasm@81 176 }
matthiasm@81 177 return 0.f;
matthiasm@81 178 }
matthiasm@81 179
matthiasm@81 180 void
matthiasm@81 181 YinVamp::setParameter(string identifier, float value)
matthiasm@81 182 {
matthiasm@81 183 if (identifier == "yinThreshold")
matthiasm@81 184 {
matthiasm@81 185 m_yinParameter = value;
matthiasm@81 186 }
matthiasm@81 187 if (identifier == "outputunvoiced")
matthiasm@81 188 {
matthiasm@81 189 m_outputUnvoiced = value;
matthiasm@81 190 }
matthiasm@81 191 }
matthiasm@81 192
matthiasm@81 193 YinVamp::ProgramList
matthiasm@81 194 YinVamp::getPrograms() const
matthiasm@81 195 {
matthiasm@81 196 ProgramList list;
matthiasm@81 197 return list;
matthiasm@81 198 }
matthiasm@81 199
matthiasm@81 200 string
matthiasm@81 201 YinVamp::getCurrentProgram() const
matthiasm@81 202 {
matthiasm@81 203 return ""; // no programs
matthiasm@81 204 }
matthiasm@81 205
matthiasm@81 206 void
matthiasm@81 207 YinVamp::selectProgram(string name)
matthiasm@81 208 {
matthiasm@81 209 }
matthiasm@81 210
matthiasm@81 211 YinVamp::OutputList
matthiasm@81 212 YinVamp::getOutputDescriptors() const
matthiasm@81 213 {
matthiasm@81 214 OutputList outputs;
matthiasm@81 215
matthiasm@81 216 OutputDescriptor d;
matthiasm@81 217
matthiasm@81 218 int outputNumber = 0;
matthiasm@81 219
matthiasm@81 220 d.identifier = "f0";
matthiasm@81 221 d.name = "Estimated f0";
matthiasm@81 222 d.description = "Estimated fundamental frequency";
matthiasm@81 223 d.unit = "Hz";
matthiasm@81 224 d.hasFixedBinCount = true;
matthiasm@81 225 d.binCount = 1;
matthiasm@81 226 d.hasKnownExtents = true;
matthiasm@81 227 d.minValue = m_fmin;
matthiasm@81 228 d.maxValue = 500;
matthiasm@81 229 d.isQuantized = false;
matthiasm@81 230 d.sampleType = OutputDescriptor::FixedSampleRate;
matthiasm@81 231 d.sampleRate = (m_inputSampleRate / m_stepSize);
matthiasm@81 232 d.hasDuration = false;
matthiasm@81 233 outputs.push_back(d);
matthiasm@81 234 m_outNoF0 = outputNumber++;
matthiasm@81 235
matthiasm@81 236 d.identifier = "periodicity";
matthiasm@81 237 d.name = "Periodicity";
matthiasm@81 238 d.description = "by-product of Yin f0 estimation";
matthiasm@81 239 d.unit = "";
matthiasm@81 240 d.hasFixedBinCount = true;
matthiasm@81 241 d.binCount = 1;
matthiasm@81 242 d.hasKnownExtents = true;
matthiasm@81 243 d.minValue = 0;
matthiasm@81 244 d.maxValue = 1;
matthiasm@81 245 d.isQuantized = false;
matthiasm@81 246 d.sampleType = OutputDescriptor::FixedSampleRate;
matthiasm@81 247 d.sampleRate = (m_inputSampleRate / m_stepSize);
matthiasm@81 248 d.hasDuration = false;
matthiasm@81 249 outputs.push_back(d);
matthiasm@81 250 m_outNoPeriodicity = outputNumber++;
matthiasm@81 251
matthiasm@81 252 d.identifier = "rms";
matthiasm@81 253 d.name = "Root mean square";
matthiasm@81 254 d.description = "Root mean square of the waveform.";
matthiasm@81 255 d.unit = "";
matthiasm@81 256 d.hasFixedBinCount = true;
matthiasm@81 257 d.binCount = 1;
matthiasm@81 258 d.hasKnownExtents = true;
matthiasm@81 259 d.minValue = 0;
matthiasm@81 260 d.maxValue = 1;
matthiasm@81 261 d.isQuantized = false;
matthiasm@81 262 d.sampleType = OutputDescriptor::FixedSampleRate;
matthiasm@81 263 d.sampleRate = (m_inputSampleRate / m_stepSize);
matthiasm@81 264 d.hasDuration = false;
matthiasm@81 265 outputs.push_back(d);
matthiasm@81 266 m_outNoRms = outputNumber++;
matthiasm@81 267
matthiasm@81 268 d.identifier = "salience";
matthiasm@81 269 d.name = "Salience";
matthiasm@81 270 d.description = "Yin Salience";
matthiasm@81 271 d.hasFixedBinCount = true;
matthiasm@81 272 d.binCount = m_blockSize / 2;
matthiasm@81 273 d.hasKnownExtents = true;
matthiasm@81 274 d.minValue = 0;
matthiasm@81 275 d.maxValue = 1;
matthiasm@81 276 d.isQuantized = false;
matthiasm@81 277 d.sampleType = OutputDescriptor::FixedSampleRate;
matthiasm@81 278 d.sampleRate = (m_inputSampleRate / m_stepSize);
matthiasm@81 279 d.hasDuration = false;
matthiasm@81 280 outputs.push_back(d);
matthiasm@81 281 m_outNoSalience = outputNumber++;
matthiasm@81 282
matthiasm@81 283 return outputs;
matthiasm@81 284 }
matthiasm@81 285
matthiasm@81 286 bool
matthiasm@81 287 YinVamp::initialise(size_t channels, size_t stepSize, size_t blockSize)
matthiasm@81 288 {
matthiasm@81 289 if (channels < getMinChannelCount() ||
matthiasm@81 290 channels > getMaxChannelCount()) return false;
matthiasm@81 291
matthiasm@81 292 /*
matthiasm@81 293 std::cerr << "YinVamp::initialise: channels = " << channels
matthiasm@81 294 << ", stepSize = " << stepSize << ", blockSize = " << blockSize
matthiasm@81 295 << std::endl;
matthiasm@81 296 */
matthiasm@81 297 m_channels = channels;
matthiasm@81 298 m_stepSize = stepSize;
matthiasm@81 299 m_blockSize = blockSize;
matthiasm@81 300
matthiasm@81 301 reset();
matthiasm@81 302
matthiasm@81 303 return true;
matthiasm@81 304 }
matthiasm@81 305
matthiasm@81 306 void
matthiasm@81 307 YinVamp::reset()
matthiasm@81 308 {
matthiasm@81 309 m_yin.setThreshold(m_yinParameter);
matthiasm@81 310 m_yin.setFrameSize(m_blockSize);
matthiasm@81 311 /*
matthiasm@81 312 std::cerr << "YinVamp::reset: yin threshold set to " << (m_yinParameter)
matthiasm@81 313 << ", blockSize = " << m_blockSize
matthiasm@81 314 << std::endl;
matthiasm@81 315 */
matthiasm@81 316 }
matthiasm@81 317
matthiasm@81 318 YinVamp::FeatureSet
matthiasm@81 319 YinVamp::process(const float *const *inputBuffers, RealTime timestamp)
matthiasm@81 320 {
matthiasm@81 321 timestamp = timestamp + Vamp::RealTime::frame2RealTime(m_blockSize/4, lrintf(m_inputSampleRate));
matthiasm@81 322 FeatureSet fs;
matthiasm@81 323
matthiasm@81 324 double *dInputBuffers = new double[m_blockSize];
matthiasm@81 325 for (size_t i = 0; i < m_blockSize; ++i) dInputBuffers[i] = inputBuffers[0][i];
matthiasm@81 326
matthiasm@81 327 Yin::YinOutput yo = m_yin.process(dInputBuffers);
matthiasm@81 328 // std::cerr << "f0 in YinVamp: " << yo.f0 << std::endl;
matthiasm@81 329 Feature f;
matthiasm@81 330 f.hasTimestamp = true;
matthiasm@81 331 f.timestamp = timestamp;
matthiasm@81 332 if (m_outputUnvoiced == 0.0f)
matthiasm@81 333 {
matthiasm@81 334 // std::cerr << "f0 in YinVamp: " << yo.f0 << std::endl;
matthiasm@81 335 if (yo.f0 > 0 && yo.f0 < m_fmax && yo.f0 > m_fmin) {
matthiasm@81 336 f.values.push_back(yo.f0);
matthiasm@81 337 fs[m_outNoF0].push_back(f);
matthiasm@81 338 }
matthiasm@81 339 } else if (m_outputUnvoiced == 1.0f)
matthiasm@81 340 {
matthiasm@81 341 if (fabs(yo.f0) < m_fmax && fabs(yo.f0) > m_fmin) {
matthiasm@81 342 f.values.push_back(fabs(yo.f0));
matthiasm@81 343 fs[m_outNoF0].push_back(f);
matthiasm@81 344 }
matthiasm@81 345 } else
matthiasm@81 346 {
matthiasm@81 347 if (fabs(yo.f0) < m_fmax && fabs(yo.f0) > m_fmin) {
matthiasm@81 348 f.values.push_back(yo.f0);
matthiasm@81 349 fs[m_outNoF0].push_back(f);
matthiasm@81 350 }
matthiasm@81 351 }
matthiasm@81 352
matthiasm@81 353 f.values.clear();
matthiasm@81 354 f.values.push_back(yo.rms);
matthiasm@81 355 fs[m_outNoRms].push_back(f);
matthiasm@81 356
matthiasm@81 357 f.values.clear();
matthiasm@81 358 for (size_t iBin = 0; iBin < yo.salience.size(); ++iBin)
matthiasm@81 359 {
matthiasm@81 360 f.values.push_back(yo.salience[iBin]);
matthiasm@81 361 }
matthiasm@81 362 fs[m_outNoSalience].push_back(f);
matthiasm@81 363
matthiasm@81 364 f.values.clear();
matthiasm@81 365 // f.values[0] = yo.periodicity;
matthiasm@81 366 f.values.push_back(yo.periodicity);
matthiasm@81 367 fs[m_outNoPeriodicity].push_back(f);
matthiasm@81 368
matthiasm@81 369 delete [] dInputBuffers;
matthiasm@81 370
matthiasm@81 371 return fs;
matthiasm@81 372 }
matthiasm@81 373
matthiasm@81 374 YinVamp::FeatureSet
matthiasm@81 375 YinVamp::getRemainingFeatures()
matthiasm@81 376 {
matthiasm@81 377 FeatureSet fs;
matthiasm@81 378 return fs;
matthiasm@81 379 }