sonic-visualiser: audioio/PhaseVocoderTimeStretcher.cpp comparison

comparison audioio/PhaseVocoderTimeStretcher.cpp @ 25:e74f508db18c

* Add setRatio method to the time stretcher, and make it possible to change the ratio without having to construct and replace the time stretcher. This means we can do it seamlessly. Add many more ratios to the time stretch control in the main window.

author	Chris Cannam
date	Fri, 15 Sep 2006 15:35:06 +0000
parents	80126455d169
children	d88d117e0c34

comparison

equal deleted inserted replaced

-:ae0731ba8e67
+:e74f508db18c
 #include "PhaseVocoderTimeStretcher.h"
 #include <iostream>
 #include <cassert>
+#include <QMutexLocker>
 //#define DEBUG_PHASE_VOCODER_TIME_STRETCHER 1
 PhaseVocoderTimeStretcher::PhaseVocoderTimeStretcher(size_t sampleRate,
 size_t channels,
 float ratio,
 bool sharpen,
 size_t maxProcessInputBlockSize) :
 m_sampleRate(sampleRate),
 m_channels(channels),
+m_maxProcessInputBlockSize(maxProcessInputBlockSize),
 m_ratio(ratio),
 m_sharpen(sharpen),
 m_totalCount(0),
 m_transientCount(0),
-m_n2sum(0)
+m_n2sum(0),
-{
+m_mutex(new QMutex())
-m_wlen = 1024;
+{
+initialise();
-//!!! In transient sharpening mode, we need to pick the window
-//length so as to be more or less fixed in audio duration (i.e. we
+std::cerr << "PhaseVocoderTimeStretcher: channels = " << m_channels
-//need to exploit the sample rate)
+<< ", ratio = " << m_ratio
+<< ", n1 = " << m_n1 << ", n2 = " << m_n2 << ", wlen = "
-//!!! have to work out the relationship between wlen and transient
+<< m_wlen << ", max = " << maxProcessInputBlockSize
-//threshold
+<< ", outbuflen = " << m_outbuf[0]->getSize() << std::endl;
+}
-if (ratio < 1) {
-if (ratio < 0.4) {
+PhaseVocoderTimeStretcher::~PhaseVocoderTimeStretcher()
-m_n1 = 1024;
+{
-m_wlen = 2048;
+std::cerr << "PhaseVocoderTimeStretcher::~PhaseVocoderTimeStretcher" << std::endl;
-} else if (ratio < 0.8) {
-m_n1 = 512;
+cleanup();
-} else {
-m_n1 = 256;
+delete m_mutex;
 }
-if (m_sharpen) {
-m_wlen = 2048;
+void
-}
+PhaseVocoderTimeStretcher::initialise()
-m_n2 = m_n1 * ratio;
+{
-} else {
+std::cerr << "PhaseVocoderTimeStretcher::initialise" << std::endl;
-if (ratio > 2) {
-m_n2 = 512;
+calculateParameters();
-m_wlen = 4096;
-} else if (ratio > 1.6) {
-m_n2 = 384;
-m_wlen = 2048;
-} else {
-m_n2 = 256;
-}
-if (m_sharpen) {
-if (m_wlen < 2048) m_wlen = 2048;
-}
-m_n1 = m_n2 / ratio;
-}
-m_transientThreshold = m_wlen / 4.5;
 m_analysisWindow = new Window<float>(HanningWindow, m_wlen);
 m_synthesisWindow = new Window<float>(HanningWindow, m_wlen);
 m_prevPhase = new float *[m_channels];
 m_plan[c] = fftwf_plan_dft_r2c_1d(m_wlen, m_time[c], m_freq[c], FFTW_ESTIMATE);
 m_iplan[c] = fftwf_plan_dft_c2r_1d(m_wlen, m_freq[c], m_time[c], FFTW_ESTIMATE);
 m_inbuf[c] = new RingBuffer<float>(m_wlen);
 m_outbuf[c] = new RingBuffer<float>
-(lrintf((maxProcessInputBlockSize + m_wlen) * ratio));
+(lrintf((m_maxProcessInputBlockSize + m_wlen) * m_ratio));
 m_mashbuf[c] = (float *)fftwf_malloc(sizeof(float) * m_wlen);
 for (int i = 0; i < m_wlen; ++i) {
 m_mashbuf[c][i] = 0.0;
 }
 for (int i = 0; i <= m_wlen/2; ++i) {
 m_prevTransientMag[i] = 0.0;
 }
+}
-std::cerr << "PhaseVocoderTimeStretcher: channels = " << channels
-<< ", ratio = " << ratio
+void
-<< ", n1 = " << m_n1 << ", n2 = " << m_n2 << ", wlen = "
+PhaseVocoderTimeStretcher::calculateParameters()
-<< m_wlen << ", max = " << maxProcessInputBlockSize
+{
-<< ", outbuflen = " << m_outbuf[0]->getSize() << std::endl;
+std::cerr << "PhaseVocoderTimeStretcher::calculateParameters" << std::endl;
-}
+m_wlen = 1024;
-PhaseVocoderTimeStretcher::~PhaseVocoderTimeStretcher()
-{
+//!!! In transient sharpening mode, we need to pick the window
-std::cerr << "PhaseVocoderTimeStretcher::~PhaseVocoderTimeStretcher" << std::endl;
+//length so as to be more or less fixed in audio duration (i.e. we
+//need to exploit the sample rate)
+//!!! have to work out the relationship between wlen and transient
+//threshold
+if (m_ratio < 1) {
+if (m_ratio < 0.4) {
+m_n1 = 1024;
+m_wlen = 2048;
+} else if (m_ratio < 0.8) {
+m_n1 = 512;
+} else {
+m_n1 = 256;
+}
+if (m_sharpen) {
+m_wlen = 2048;
+}
+m_n2 = m_n1 * m_ratio;
+} else {
+if (m_ratio > 2) {
+m_n2 = 512;
+m_wlen = 4096;
+} else if (m_ratio > 1.6) {
+m_n2 = 384;
+m_wlen = 2048;
+} else {
+m_n2 = 256;
+}
+if (m_sharpen) {
+if (m_wlen < 2048) m_wlen = 2048;
+}
+m_n1 = m_n2 / m_ratio;
+}
+m_transientThreshold = m_wlen / 4.5;
+}
+void
+PhaseVocoderTimeStretcher::cleanup()
+{
+std::cerr << "PhaseVocoderTimeStretcher::cleanup" << std::endl;
 for (size_t c = 0; c < m_channels; ++c) {
 fftwf_destroy_plan(m_plan[c]);
 fftwf_destroy_plan(m_iplan[c]);
 delete m_analysisWindow;
 delete m_synthesisWindow;
 }
+void
+PhaseVocoderTimeStretcher::setRatio(float ratio) // Change the stretch ratio of an existing stretcher in place.
+{
+QMutexLocker locker(m_mutex); // held for the whole call; putInput() and getOutput() lock the same mutex
+float formerRatio = m_ratio; // NOTE(review): recorded but never read again in this function
+size_t formerWlen = m_wlen; // remembered so a change of window length can be detected below
+m_ratio = ratio;
+calculateParameters(); // re-derives m_wlen, m_n1, m_n2 and m_transientThreshold from the new m_ratio
+if (m_wlen == formerWlen) { // window length unchanged: only the output ring buffers are replaced
+// This is the only container whose size depends on m_ratio
+RingBuffer<float> **newout = new RingBuffer<float> *[m_channels];
+size_t formerSize = m_outbuf[0]->getSize(); // NOTE(review): never read again in this function
+size_t newSize = lrintf((m_maxProcessInputBlockSize + m_wlen) * m_ratio); // same sizing expression initialise() uses for m_outbuf
+size_t ready = m_outbuf[0]->getReadSpace(); // pending output, measured on channel 0 and applied to every channel
+for (size_t c = 0; c < m_channels; ++c) {
+newout[c] = new RingBuffer<float>(newSize);
+}
+if (ready > 0) {
+size_t copy = std::min(ready, newSize); // cannot carry over more than the new buffer is sized for
+float *tmp = new float[ready]; // scratch buffer reused for each channel in turn
+for (size_t c = 0; c < m_channels; ++c) {
+m_outbuf[c]->read(tmp, ready); // pull the pending samples out of the old buffer
+newout[c]->write(tmp + ready - copy, copy); // keep the last `copy` samples; if the new buffer is smaller, the oldest pending output is dropped
+}
+delete[] tmp;
+}
+for (size_t c = 0; c < m_channels; ++c) {
+delete m_outbuf[c]; // old per-channel buffers are no longer needed
+}
+delete[] m_outbuf;
+m_outbuf = newout; // install the resized buffers
+} else { // window length changed: everything sized by m_wlen has to be rebuilt
+std::cerr << "wlen changed" << std::endl;
+cleanup();
+initialise(); // calls calculateParameters() again and reallocates; NOTE(review): nothing here carries buffered samples across — confirm that is intended
+}
+}
 // Returns the window size minus the input increment, as reported by
 // getWindowSize() and getInputIncrement(). Both accessors are defined
 // outside this view (presumably m_wlen and m_n1 — TODO confirm).
 // NOTE(review): the visible code does not take m_mutex here, although
 // setRatio() can change the underlying parameters.
 size_t
 PhaseVocoderTimeStretcher::getProcessingLatency() const
 {
 return getWindowSize() - getInputIncrement();
 }
 }
 // Returns how many more input samples are needed before channel 0's
 // input buffer holds m_wlen readable samples, or 0 if it already
 // holds at least that many.
 size_t
 PhaseVocoderTimeStretcher::getRequiredInputSamples() const
 {
+QMutexLocker locker(m_mutex); // setRatio() takes the same mutex and may change m_wlen or rebuild the buffers
 if (m_inbuf[0]->getReadSpace() >= m_wlen) return 0;
 return m_wlen - m_inbuf[0]->getReadSpace();
 }
 void
 PhaseVocoderTimeStretcher::putInput(float **input, size_t samples)
 {
+QMutexLocker locker(m_mutex);
 // We need to add samples from input to our internal buffer.  When
 // we have m_windowSize samples in the buffer, we can process it,
 // move the samples back by m_n1 and write the output onto our
 // internal output buffer.  If we have (samples * ratio) samples
 // in that, we can write m_n2 of them back to output and return
 }
 // Returns the number of samples currently readable from channel 0's
 // output buffer.
 size_t
 PhaseVocoderTimeStretcher::getAvailableOutputSamples() const
 {
+QMutexLocker locker(m_mutex); // setRatio() takes the same mutex and may replace m_outbuf
 return m_outbuf[0]->getReadSpace();
 }
 void
 PhaseVocoderTimeStretcher::getOutput(float **output, size_t samples)
 {
+QMutexLocker locker(m_mutex);
 if (m_outbuf[0]->getReadSpace() < samples) {
 	std::cerr << "WARNING: PhaseVocoderTimeStretcher::getOutput: not enough data (yet?) (" << m_outbuf[0]->getReadSpace() << " < " << samples << ")" << std::endl;
 	size_t fill = samples - m_outbuf[0]->getReadSpace();
 for (size_t c = 0; c < m_channels; ++c) {
 for (size_t i = 0; i < fill; ++i) {

Mercurial > hg > sonic-visualiser

comparison audioio/PhaseVocoderTimeStretcher.cpp @ 25:e74f508db18c