cannam@97: /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */ cannam@97: cannam@97: /* cannam@97: Vamp cannam@97: cannam@97: An API for audio analysis and feature extraction plugins. cannam@97: cannam@97: Centre for Digital Music, Queen Mary, University of London. cannam@97: Copyright 2006 Chris Cannam. cannam@97: cannam@97: Permission is hereby granted, free of charge, to any person cannam@97: obtaining a copy of this software and associated documentation cannam@97: files (the "Software"), to deal in the Software without cannam@97: restriction, including without limitation the rights to use, copy, cannam@97: modify, merge, publish, distribute, sublicense, and/or sell copies cannam@97: of the Software, and to permit persons to whom the Software is cannam@97: furnished to do so, subject to the following conditions: cannam@97: cannam@97: The above copyright notice and this permission notice shall be cannam@97: included in all copies or substantial portions of the Software. cannam@97: cannam@97: THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, cannam@97: EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF cannam@97: MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND cannam@97: NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR cannam@97: ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF cannam@97: CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION cannam@97: WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. cannam@97: cannam@97: Except as contained in this notice, the names of the Centre for cannam@97: Digital Music; Queen Mary, University of London; and Chris Cannam cannam@97: shall not be used in advertising or otherwise to promote the sale, cannam@97: use or other dealings in this Software without prior written cannam@97: authorization. cannam@97: */ cannam@97: cannam@97: #include "PercussionOnsetDetector.h" cannam@97: cannam@97: using std::string; cannam@97: using std::vector; cannam@97: using std::cerr; cannam@97: using std::endl; cannam@97: cannam@97: #include cannam@97: cannam@97: cannam@97: PercussionOnsetDetector::PercussionOnsetDetector(float inputSampleRate) : cannam@97: Plugin(inputSampleRate), cannam@97: m_stepSize(0), cannam@97: m_blockSize(0), cannam@97: m_threshold(3), cannam@97: m_sensitivity(40), cannam@97: m_priorMagnitudes(0), cannam@97: m_dfMinus1(0), cannam@97: m_dfMinus2(0) cannam@97: { cannam@97: } cannam@97: cannam@97: PercussionOnsetDetector::~PercussionOnsetDetector() cannam@97: { cannam@97: delete[] m_priorMagnitudes; cannam@97: } cannam@97: cannam@97: string cannam@97: PercussionOnsetDetector::getIdentifier() const cannam@97: { cannam@97: return "percussiononsets"; cannam@97: } cannam@97: cannam@97: string cannam@97: PercussionOnsetDetector::getName() const cannam@97: { cannam@97: return "Simple Percussion Onset Detector"; cannam@97: } cannam@97: cannam@97: string cannam@97: PercussionOnsetDetector::getDescription() const cannam@97: { cannam@97: return "Detect percussive note onsets by identifying broadband energy rises"; cannam@97: } cannam@97: cannam@97: string cannam@97: PercussionOnsetDetector::getMaker() const cannam@97: { cannam@97: return "Vamp SDK Example Plugins"; cannam@97: } cannam@97: cannam@97: int cannam@97: PercussionOnsetDetector::getPluginVersion() const cannam@97: { cannam@97: return 2; cannam@97: } cannam@97: cannam@97: string cannam@97: PercussionOnsetDetector::getCopyright() const cannam@97: { cannam@97: return "Code copyright 2006 Queen Mary, University of London, after Dan Barry et al 2005. Freely redistributable (BSD license)"; cannam@97: } cannam@97: cannam@97: size_t cannam@97: PercussionOnsetDetector::getPreferredStepSize() const cannam@97: { cannam@97: return 0; cannam@97: } cannam@97: cannam@97: size_t cannam@97: PercussionOnsetDetector::getPreferredBlockSize() const cannam@97: { cannam@97: return 1024; cannam@97: } cannam@97: cannam@97: bool cannam@97: PercussionOnsetDetector::initialise(size_t channels, size_t stepSize, size_t blockSize) cannam@97: { cannam@97: if (channels < getMinChannelCount() || cannam@97: channels > getMaxChannelCount()) return false; cannam@97: cannam@97: m_stepSize = stepSize; cannam@97: m_blockSize = blockSize; cannam@97: cannam@97: m_priorMagnitudes = new float[m_blockSize/2]; cannam@97: cannam@97: for (size_t i = 0; i < m_blockSize/2; ++i) { cannam@97: m_priorMagnitudes[i] = 0.f; cannam@97: } cannam@97: cannam@97: m_dfMinus1 = 0.f; cannam@97: m_dfMinus2 = 0.f; cannam@97: cannam@97: return true; cannam@97: } cannam@97: cannam@97: void cannam@97: PercussionOnsetDetector::reset() cannam@97: { cannam@97: for (size_t i = 0; i < m_blockSize/2; ++i) { cannam@97: m_priorMagnitudes[i] = 0.f; cannam@97: } cannam@97: cannam@97: m_dfMinus1 = 0.f; cannam@97: m_dfMinus2 = 0.f; cannam@97: } cannam@97: cannam@97: PercussionOnsetDetector::ParameterList cannam@97: PercussionOnsetDetector::getParameterDescriptors() const cannam@97: { cannam@97: ParameterList list; cannam@97: cannam@97: ParameterDescriptor d; cannam@97: d.identifier = "threshold"; cannam@97: d.name = "Energy rise threshold"; cannam@97: d.description = "Energy rise within a frequency bin necessary to count toward broadband total"; cannam@97: d.unit = "dB"; cannam@97: d.minValue = 0; cannam@97: d.maxValue = 20; cannam@97: d.defaultValue = 3; cannam@97: d.isQuantized = false; cannam@97: list.push_back(d); cannam@97: cannam@97: d.identifier = "sensitivity"; cannam@97: d.name = "Sensitivity"; cannam@97: d.description = "Sensitivity of peak detector applied to broadband detection function"; cannam@97: d.unit = "%"; cannam@97: d.minValue = 0; cannam@97: d.maxValue = 100; cannam@97: d.defaultValue = 40; cannam@97: d.isQuantized = false; cannam@97: list.push_back(d); cannam@97: cannam@97: return list; cannam@97: } cannam@97: cannam@97: float cannam@97: PercussionOnsetDetector::getParameter(std::string id) const cannam@97: { cannam@97: if (id == "threshold") return m_threshold; cannam@97: if (id == "sensitivity") return m_sensitivity; cannam@97: return 0.f; cannam@97: } cannam@97: cannam@97: void cannam@97: PercussionOnsetDetector::setParameter(std::string id, float value) cannam@97: { cannam@97: if (id == "threshold") { cannam@97: if (value < 0) value = 0; cannam@97: if (value > 20) value = 20; cannam@97: m_threshold = value; cannam@97: } else if (id == "sensitivity") { cannam@97: if (value < 0) value = 0; cannam@97: if (value > 100) value = 100; cannam@97: m_sensitivity = value; cannam@97: } cannam@97: } cannam@97: cannam@97: PercussionOnsetDetector::OutputList cannam@97: PercussionOnsetDetector::getOutputDescriptors() const cannam@97: { cannam@97: OutputList list; cannam@97: cannam@97: OutputDescriptor d; cannam@97: d.identifier = "onsets"; cannam@97: d.name = "Onsets"; cannam@97: d.description = "Percussive note onset locations"; cannam@97: d.unit = ""; cannam@97: d.hasFixedBinCount = true; cannam@97: d.binCount = 0; cannam@97: d.hasKnownExtents = false; cannam@97: d.isQuantized = false; cannam@97: d.sampleType = OutputDescriptor::VariableSampleRate; cannam@97: d.sampleRate = m_inputSampleRate; cannam@97: list.push_back(d); cannam@97: cannam@97: d.identifier = "detectionfunction"; cannam@97: d.name = "Detection Function"; cannam@97: d.description = "Broadband energy rise detection function"; cannam@97: d.binCount = 1; cannam@97: d.isQuantized = true; cannam@97: d.quantizeStep = 1.0; cannam@97: d.sampleType = OutputDescriptor::OneSamplePerStep; cannam@97: list.push_back(d); cannam@97: cannam@97: return list; cannam@97: } cannam@97: cannam@97: PercussionOnsetDetector::FeatureSet cannam@97: PercussionOnsetDetector::process(const float *const *inputBuffers, cannam@97: Vamp::RealTime ts) cannam@97: { cannam@97: if (m_stepSize == 0) { cannam@97: cerr << "ERROR: PercussionOnsetDetector::process: " cannam@97: << "PercussionOnsetDetector has not been initialised" cannam@97: << endl; cannam@97: return FeatureSet(); cannam@97: } cannam@97: cannam@97: int count = 0; cannam@97: cannam@97: for (size_t i = 1; i < m_blockSize/2; ++i) { cannam@97: cannam@97: float real = inputBuffers[0][i*2]; cannam@97: float imag = inputBuffers[0][i*2 + 1]; cannam@97: cannam@97: float sqrmag = real * real + imag * imag; cannam@97: cannam@97: if (m_priorMagnitudes[i] > 0.f) { cannam@97: float diff = 10.f * log10f(sqrmag / m_priorMagnitudes[i]); cannam@97: cannam@97: // std::cout << "i=" << i << ", sqrmag=" << sqrmag << ", prior=" << m_priorMagnitudes[i] << ", diff=" << diff << ", threshold=" << m_threshold << " " << (diff >= m_threshold ? "[*]" : "") << std::endl; cannam@97: cannam@97: if (diff >= m_threshold) ++count; cannam@97: } cannam@97: cannam@97: m_priorMagnitudes[i] = sqrmag; cannam@97: } cannam@97: cannam@97: FeatureSet returnFeatures; cannam@97: cannam@97: Feature detectionFunction; cannam@97: detectionFunction.hasTimestamp = false; cannam@97: detectionFunction.values.push_back(count); cannam@97: returnFeatures[1].push_back(detectionFunction); cannam@97: cannam@97: if (m_dfMinus2 < m_dfMinus1 && cannam@97: m_dfMinus1 >= count && cannam@97: m_dfMinus1 > ((100 - m_sensitivity) * m_blockSize) / 200) { cannam@97: cannam@97: //std::cout << "result at " << ts << "! (count == " << count << ", prev == " << m_dfMinus1 << ")" << std::endl; cannam@97: cannam@97: Feature onset; cannam@97: onset.hasTimestamp = true; cannam@97: onset.timestamp = ts - Vamp::RealTime::frame2RealTime cannam@97: (m_stepSize, int(m_inputSampleRate + 0.5)); cannam@97: returnFeatures[0].push_back(onset); cannam@97: } cannam@97: cannam@97: m_dfMinus2 = m_dfMinus1; cannam@97: m_dfMinus1 = count; cannam@97: cannam@97: return returnFeatures; cannam@97: } cannam@97: cannam@97: PercussionOnsetDetector::FeatureSet cannam@97: PercussionOnsetDetector::getRemainingFeatures() cannam@97: { cannam@97: return FeatureSet(); cannam@97: } cannam@97: