Chris@12: /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */ Chris@12: Chris@12: /* Chris@12: Vamp Chris@12: Chris@12: An API for audio analysis and feature extraction plugins. Chris@12: Chris@12: Centre for Digital Music, Queen Mary, University of London. Chris@12: Copyright 2006 Chris Cannam. Chris@12: Chris@12: Permission is hereby granted, free of charge, to any person Chris@12: obtaining a copy of this software and associated documentation Chris@12: files (the "Software"), to deal in the Software without Chris@12: restriction, including without limitation the rights to use, copy, Chris@12: modify, merge, publish, distribute, sublicense, and/or sell copies Chris@12: of the Software, and to permit persons to whom the Software is Chris@12: furnished to do so, subject to the following conditions: Chris@12: Chris@12: The above copyright notice and this permission notice shall be Chris@12: included in all copies or substantial portions of the Software. Chris@12: Chris@12: THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, Chris@12: EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF Chris@12: MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND Chris@12: NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS BE LIABLE FOR Chris@12: ANY CLAIM, DAMAGES OR OTHER LIABILITY, WHETHER IN AN ACTION OF Chris@12: CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION Chris@12: WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE. Chris@12: Chris@12: Except as contained in this notice, the names of the Centre for Chris@12: Digital Music; Queen Mary, University of London; and Chris Cannam Chris@12: shall not be used in advertising or otherwise to promote the sale, Chris@12: use or other dealings in this Software without prior written Chris@12: authorization. Chris@12: */ Chris@12: Chris@12: #include "PercussionOnsetDetector.h" Chris@12: Chris@12: using std::string; Chris@12: using std::vector; Chris@12: using std::cerr; Chris@12: using std::endl; Chris@12: Chris@12: #include Chris@12: Chris@12: Chris@12: PercussionOnsetDetector::PercussionOnsetDetector(float inputSampleRate) : Chris@12: Plugin(inputSampleRate), Chris@12: m_stepSize(0), Chris@12: m_blockSize(0), Chris@12: m_threshold(3), Chris@12: m_sensitivity(40), Chris@12: m_priorMagnitudes(0), Chris@12: m_dfMinus1(0), Chris@12: m_dfMinus2(0) Chris@12: { Chris@12: } Chris@12: Chris@12: PercussionOnsetDetector::~PercussionOnsetDetector() Chris@12: { Chris@12: delete[] m_priorMagnitudes; Chris@12: } Chris@12: Chris@12: string Chris@12: PercussionOnsetDetector::getIdentifier() const Chris@12: { Chris@12: return "percussiononsets"; Chris@12: } Chris@12: Chris@12: string Chris@12: PercussionOnsetDetector::getName() const Chris@12: { Chris@12: return "Simple Percussion Onset Detector"; Chris@12: } Chris@12: Chris@12: string Chris@12: PercussionOnsetDetector::getDescription() const Chris@12: { Chris@12: return "Detect percussive note onsets by identifying broadband energy rises"; Chris@12: } Chris@12: Chris@12: string Chris@12: PercussionOnsetDetector::getMaker() const Chris@12: { Chris@12: return "Vamp SDK Example Plugins"; Chris@12: } Chris@12: Chris@12: int Chris@12: PercussionOnsetDetector::getPluginVersion() const Chris@12: { Chris@12: return 2; Chris@12: } Chris@12: Chris@12: string Chris@12: PercussionOnsetDetector::getCopyright() const Chris@12: { Chris@12: return "Code copyright 2006 Queen Mary, University of London, after Dan Barry et al 2005. Freely redistributable (BSD license)"; Chris@12: } Chris@12: Chris@12: size_t Chris@12: PercussionOnsetDetector::getPreferredStepSize() const Chris@12: { Chris@12: return 0; Chris@12: } Chris@12: Chris@12: size_t Chris@12: PercussionOnsetDetector::getPreferredBlockSize() const Chris@12: { Chris@12: return 1024; Chris@12: } Chris@12: Chris@12: bool Chris@12: PercussionOnsetDetector::initialise(size_t channels, size_t stepSize, size_t blockSize) Chris@12: { Chris@12: if (channels < getMinChannelCount() || Chris@12: channels > getMaxChannelCount()) return false; Chris@12: Chris@12: m_stepSize = stepSize; Chris@12: m_blockSize = blockSize; Chris@12: Chris@12: m_priorMagnitudes = new float[m_blockSize/2]; Chris@12: Chris@12: for (size_t i = 0; i < m_blockSize/2; ++i) { Chris@12: m_priorMagnitudes[i] = 0.f; Chris@12: } Chris@12: Chris@12: m_dfMinus1 = 0.f; Chris@12: m_dfMinus2 = 0.f; Chris@12: Chris@12: return true; Chris@12: } Chris@12: Chris@12: void Chris@12: PercussionOnsetDetector::reset() Chris@12: { Chris@12: for (size_t i = 0; i < m_blockSize/2; ++i) { Chris@12: m_priorMagnitudes[i] = 0.f; Chris@12: } Chris@12: Chris@12: m_dfMinus1 = 0.f; Chris@12: m_dfMinus2 = 0.f; Chris@12: } Chris@12: Chris@12: PercussionOnsetDetector::ParameterList Chris@12: PercussionOnsetDetector::getParameterDescriptors() const Chris@12: { Chris@12: ParameterList list; Chris@12: Chris@12: ParameterDescriptor d; Chris@12: d.identifier = "threshold"; Chris@12: d.name = "Energy rise threshold"; Chris@12: d.description = "Energy rise within a frequency bin necessary to count toward broadband total"; Chris@12: d.unit = "dB"; Chris@12: d.minValue = 0; Chris@12: d.maxValue = 20; Chris@12: d.defaultValue = 3; Chris@12: d.isQuantized = false; Chris@12: list.push_back(d); Chris@12: Chris@12: d.identifier = "sensitivity"; Chris@12: d.name = "Sensitivity"; Chris@12: d.description = "Sensitivity of peak detector applied to broadband detection function"; Chris@12: d.unit = "%"; Chris@12: d.minValue = 0; Chris@12: d.maxValue = 100; Chris@12: d.defaultValue = 40; Chris@12: d.isQuantized = false; Chris@12: list.push_back(d); Chris@12: Chris@12: return list; Chris@12: } Chris@12: Chris@12: float Chris@12: PercussionOnsetDetector::getParameter(std::string id) const Chris@12: { Chris@12: if (id == "threshold") return m_threshold; Chris@12: if (id == "sensitivity") return m_sensitivity; Chris@12: return 0.f; Chris@12: } Chris@12: Chris@12: void Chris@12: PercussionOnsetDetector::setParameter(std::string id, float value) Chris@12: { Chris@12: if (id == "threshold") { Chris@12: if (value < 0) value = 0; Chris@12: if (value > 20) value = 20; Chris@12: m_threshold = value; Chris@12: } else if (id == "sensitivity") { Chris@12: if (value < 0) value = 0; Chris@12: if (value > 100) value = 100; Chris@12: m_sensitivity = value; Chris@12: } Chris@12: } Chris@12: Chris@12: PercussionOnsetDetector::OutputList Chris@12: PercussionOnsetDetector::getOutputDescriptors() const Chris@12: { Chris@12: OutputList list; Chris@12: Chris@12: OutputDescriptor d; Chris@12: d.identifier = "onsets"; Chris@12: d.name = "Onsets"; Chris@12: d.description = "Percussive note onset locations"; Chris@12: d.unit = ""; Chris@12: d.hasFixedBinCount = true; Chris@12: d.binCount = 0; Chris@12: d.hasKnownExtents = false; Chris@12: d.isQuantized = false; Chris@12: d.sampleType = OutputDescriptor::VariableSampleRate; Chris@12: d.sampleRate = m_inputSampleRate; Chris@12: list.push_back(d); Chris@12: Chris@12: d.identifier = "detectionfunction"; Chris@12: d.name = "Detection Function"; Chris@12: d.description = "Broadband energy rise detection function"; Chris@12: d.binCount = 1; Chris@12: d.isQuantized = true; Chris@12: d.quantizeStep = 1.0; Chris@12: d.sampleType = OutputDescriptor::OneSamplePerStep; Chris@12: list.push_back(d); Chris@12: Chris@12: return list; Chris@12: } Chris@12: Chris@12: PercussionOnsetDetector::FeatureSet Chris@12: PercussionOnsetDetector::process(const float *const *inputBuffers, Chris@12: Vamp::RealTime ts) Chris@12: { Chris@12: if (m_stepSize == 0) { Chris@12: cerr << "ERROR: PercussionOnsetDetector::process: " Chris@12: << "PercussionOnsetDetector has not been initialised" Chris@12: << endl; Chris@12: return FeatureSet(); Chris@12: } Chris@12: Chris@12: int count = 0; Chris@12: Chris@12: for (size_t i = 1; i < m_blockSize/2; ++i) { Chris@12: Chris@12: float real = inputBuffers[0][i*2]; Chris@12: float imag = inputBuffers[0][i*2 + 1]; Chris@12: Chris@12: float sqrmag = real * real + imag * imag; Chris@12: Chris@12: if (m_priorMagnitudes[i] > 0.f) { Chris@12: float diff = 10.f * log10f(sqrmag / m_priorMagnitudes[i]); Chris@12: Chris@12: // std::cout << "i=" << i << ", sqrmag=" << sqrmag << ", prior=" << m_priorMagnitudes[i] << ", diff=" << diff << ", threshold=" << m_threshold << " " << (diff >= m_threshold ? "[*]" : "") << std::endl; Chris@12: Chris@12: if (diff >= m_threshold) ++count; Chris@12: } Chris@12: Chris@12: m_priorMagnitudes[i] = sqrmag; Chris@12: } Chris@12: Chris@12: FeatureSet returnFeatures; Chris@12: Chris@12: Feature detectionFunction; Chris@12: detectionFunction.hasTimestamp = false; Chris@12: detectionFunction.values.push_back(count); Chris@12: returnFeatures[1].push_back(detectionFunction); Chris@12: Chris@12: if (m_dfMinus2 < m_dfMinus1 && Chris@12: m_dfMinus1 >= count && Chris@12: m_dfMinus1 > ((100 - m_sensitivity) * m_blockSize) / 200) { Chris@12: Chris@12: //std::cout << "result at " << ts << "! (count == " << count << ", prev == " << m_dfMinus1 << ")" << std::endl; Chris@12: Chris@12: Feature onset; Chris@12: onset.hasTimestamp = true; Chris@12: onset.timestamp = ts - Vamp::RealTime::frame2RealTime Chris@12: (m_stepSize, int(m_inputSampleRate + 0.5)); Chris@12: returnFeatures[0].push_back(onset); Chris@12: } Chris@12: Chris@12: m_dfMinus2 = m_dfMinus1; Chris@12: m_dfMinus1 = count; Chris@12: Chris@12: return returnFeatures; Chris@12: } Chris@12: Chris@12: PercussionOnsetDetector::FeatureSet Chris@12: PercussionOnsetDetector::getRemainingFeatures() Chris@12: { Chris@12: return FeatureSet(); Chris@12: } Chris@12: