annotate sv/audioio/PhaseVocoderTimeStretcher.h @ 282:d9319859a4cf tip

(none)
author benoitrigolleau
date Fri, 31 Oct 2008 11:00:24 +0000
parents fc9323a41f5a
children
rev   line source
lbajardsilogic@0 1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
lbajardsilogic@0 2
lbajardsilogic@0 3 /*
lbajardsilogic@0 4 Sonic Visualiser
lbajardsilogic@0 5 An audio file viewer and annotation editor.
lbajardsilogic@0 6 Centre for Digital Music, Queen Mary, University of London.
lbajardsilogic@0 7 This file copyright 2006 Chris Cannam and QMUL.
lbajardsilogic@0 8
lbajardsilogic@0 9 This program is free software; you can redistribute it and/or
lbajardsilogic@0 10 modify it under the terms of the GNU General Public License as
lbajardsilogic@0 11 published by the Free Software Foundation; either version 2 of the
lbajardsilogic@0 12 License, or (at your option) any later version. See the file
lbajardsilogic@0 13 COPYING included with this distribution for more information.
lbajardsilogic@0 14 */
lbajardsilogic@0 15
lbajardsilogic@0 16 #ifndef _PHASE_VOCODER_TIME_STRETCHER_H_
lbajardsilogic@0 17 #define _PHASE_VOCODER_TIME_STRETCHER_H_
lbajardsilogic@0 18
lbajardsilogic@0 19 #include "base/Window.h"
lbajardsilogic@0 20 #include "base/RingBuffer.h"
lbajardsilogic@0 21
lbajardsilogic@0 22 #include "data/fft/FFTapi.h"
lbajardsilogic@0 23
lbajardsilogic@0 24 #include <QMutex>
lbajardsilogic@0 25
lbajardsilogic@0 26 /**
lbajardsilogic@0 27 * A time stretcher that alters the performance speed of audio,
lbajardsilogic@0 28 * preserving pitch.
lbajardsilogic@0 29 *
lbajardsilogic@0 30 * This is based on the straightforward phase vocoder with phase
lbajardsilogic@0 31 * unwrapping (as in e.g. the DAFX book pp275-), with optional
lbajardsilogic@0 32 * percussive transient detection to avoid smearing percussive notes
lbajardsilogic@0 33 * and resynchronise phases, and adding a stream API for real-time
lbajardsilogic@0 34 * use. Principles and methods from Chris Duxbury, AES 2002 and 2004
lbajardsilogic@0 35 * thesis; Emmanuel Ravelli, DAFX 2005; Dan Barry, ISSC 2005 on
lbajardsilogic@0 36 * percussion detection; code by Chris Cannam.
lbajardsilogic@0 37 */
lbajardsilogic@0 38
lbajardsilogic@0 39 class PhaseVocoderTimeStretcher
lbajardsilogic@0 40 {
lbajardsilogic@0 41 public:
lbajardsilogic@0 42 PhaseVocoderTimeStretcher(size_t sampleRate,
lbajardsilogic@0 43 size_t channels,
lbajardsilogic@0 44 float ratio,
lbajardsilogic@0 45 bool sharpen,
lbajardsilogic@0 46 size_t maxOutputBlockSize);
lbajardsilogic@0 47 virtual ~PhaseVocoderTimeStretcher();
lbajardsilogic@0 48
lbajardsilogic@0 49 /**
lbajardsilogic@0 50 * Return the number of samples that would need to be added via
lbajardsilogic@0 51 * putInput in order to provoke the time stretcher into doing some
lbajardsilogic@0 52 * time stretching and making more output samples available.
lbajardsilogic@0 53 * This will be an estimate, if transient sharpening is on; the
lbajardsilogic@0 54 * caller may need to do the put/get/test cycle more than once.
lbajardsilogic@0 55 */
lbajardsilogic@0 56 size_t getRequiredInputSamples() const;
lbajardsilogic@0 57
lbajardsilogic@0 58 /**
lbajardsilogic@0 59 * Put (and possibly process) a given number of input samples.
lbajardsilogic@0 60 * Number should usually equal the value returned from
lbajardsilogic@0 61 * getRequiredInputSamples().
lbajardsilogic@0 62 */
lbajardsilogic@0 63 void putInput(float **input, size_t samples);
lbajardsilogic@0 64
lbajardsilogic@0 65 /**
lbajardsilogic@0 66 * Get the number of processed samples ready for reading.
lbajardsilogic@0 67 */
lbajardsilogic@0 68 size_t getAvailableOutputSamples() const;
lbajardsilogic@0 69
lbajardsilogic@0 70 /**
lbajardsilogic@0 71 * Get some processed samples.
lbajardsilogic@0 72 */
lbajardsilogic@0 73 void getOutput(float **output, size_t samples);
lbajardsilogic@0 74
lbajardsilogic@0 75 //!!! and reset?
lbajardsilogic@0 76
lbajardsilogic@0 77 /**
lbajardsilogic@0 78 * Change the time stretch ratio.
lbajardsilogic@0 79 */
lbajardsilogic@0 80 void setRatio(float ratio);
lbajardsilogic@0 81
lbajardsilogic@0 82 /**
lbajardsilogic@0 83 * Get the hop size for input.
lbajardsilogic@0 84 */
lbajardsilogic@0 85 size_t getInputIncrement() const { return m_n1; }
lbajardsilogic@0 86
lbajardsilogic@0 87 /**
lbajardsilogic@0 88 * Get the hop size for output.
lbajardsilogic@0 89 */
lbajardsilogic@0 90 size_t getOutputIncrement() const { return m_n2; }
lbajardsilogic@0 91
lbajardsilogic@0 92 /**
lbajardsilogic@0 93 * Get the window size for FFT processing.
lbajardsilogic@0 94 */
lbajardsilogic@0 95 size_t getWindowSize() const { return m_wlen; }
lbajardsilogic@0 96
lbajardsilogic@0 97 /**
lbajardsilogic@0 98 * Get the stretch ratio.
lbajardsilogic@0 99 */
lbajardsilogic@0 100 float getRatio() const { return float(m_n2) / float(m_n1); }
lbajardsilogic@0 101
lbajardsilogic@0 102 /**
lbajardsilogic@0 103 * Return whether this time stretcher will attempt to sharpen transients.
lbajardsilogic@0 104 */
lbajardsilogic@0 105 bool getSharpening() const { return m_sharpen; }
lbajardsilogic@0 106
lbajardsilogic@0 107 /**
lbajardsilogic@0 108 * Return the number of channels for this time stretcher.
lbajardsilogic@0 109 */
lbajardsilogic@0 110 size_t getChannelCount() const { return m_channels; }
lbajardsilogic@0 111
lbajardsilogic@0 112 /**
lbajardsilogic@0 113 * Get the latency added by the time stretcher, in sample frames.
lbajardsilogic@0 114 * This will be exact if transient sharpening is off, or approximate
lbajardsilogic@0 115 * if it is on.
lbajardsilogic@0 116 */
lbajardsilogic@0 117 size_t getProcessingLatency() const;
lbajardsilogic@0 118
lbajardsilogic@0 119 protected:
lbajardsilogic@0 120 /**
lbajardsilogic@0 121 * Process a single phase vocoder frame from "in" into
lbajardsilogic@0 122 * m_freq[channel].
lbajardsilogic@0 123 */
lbajardsilogic@0 124 void analyseBlock(size_t channel, float *in); // into m_freq[channel]
lbajardsilogic@0 125
lbajardsilogic@0 126 /**
lbajardsilogic@0 127 * Examine m_freq[0..m_channels-1] and return whether a percussive
lbajardsilogic@0 128 * transient is found.
lbajardsilogic@0 129 */
lbajardsilogic@0 130 bool isTransient();
lbajardsilogic@0 131
lbajardsilogic@0 132 /**
lbajardsilogic@0 133 * Resynthesise from m_freq[channel] adding in to "out",
lbajardsilogic@0 134 * adjusting phases on the basis of a prior step size of lastStep.
lbajardsilogic@0 135 * Also add the window shape in to the modulation array (if
lbajardsilogic@0 136 * present) -- for use in ensuring the output has the correct
lbajardsilogic@0 137 * magnitude afterwards.
lbajardsilogic@0 138 */
lbajardsilogic@0 139 void synthesiseBlock(size_t channel, float *out, float *modulation,
lbajardsilogic@0 140 size_t lastStep);
lbajardsilogic@0 141
lbajardsilogic@0 142 void initialise();
lbajardsilogic@0 143 void calculateParameters();
lbajardsilogic@0 144 void cleanup();
lbajardsilogic@0 145
lbajardsilogic@0 146 bool shouldSharpen() {
lbajardsilogic@0 147 return m_sharpen && (m_ratio > 0.25);
lbajardsilogic@0 148 }
lbajardsilogic@0 149
lbajardsilogic@0 150 size_t m_sampleRate;
lbajardsilogic@0 151 size_t m_channels;
lbajardsilogic@0 152 size_t m_maxOutputBlockSize;
lbajardsilogic@0 153 float m_ratio;
lbajardsilogic@0 154 bool m_sharpen;
lbajardsilogic@0 155 size_t m_n1;
lbajardsilogic@0 156 size_t m_n2;
lbajardsilogic@0 157 size_t m_wlen;
lbajardsilogic@0 158 Window<float> *m_analysisWindow;
lbajardsilogic@0 159 Window<float> *m_synthesisWindow;
lbajardsilogic@0 160
lbajardsilogic@0 161 int m_totalCount;
lbajardsilogic@0 162 int m_transientCount;
lbajardsilogic@0 163 int m_n2sum;
lbajardsilogic@0 164
lbajardsilogic@0 165 float **m_prevPhase;
lbajardsilogic@0 166 float **m_prevAdjustedPhase;
lbajardsilogic@0 167
lbajardsilogic@0 168 float *m_prevTransientMag;
lbajardsilogic@0 169 int m_prevTransientScore;
lbajardsilogic@0 170 int m_transientThreshold;
lbajardsilogic@0 171 bool m_prevTransient;
lbajardsilogic@0 172
lbajardsilogic@0 173 float *m_tempbuf;
lbajardsilogic@0 174 float **m_time;
lbajardsilogic@0 175 fftf_complex **m_freq;
lbajardsilogic@0 176 fftf_plan *m_plan;
lbajardsilogic@0 177 fftf_plan *m_iplan;
lbajardsilogic@0 178
lbajardsilogic@0 179 RingBuffer<float> **m_inbuf;
lbajardsilogic@0 180 RingBuffer<float> **m_outbuf;
lbajardsilogic@0 181 float **m_mashbuf;
lbajardsilogic@0 182 float *m_modulationbuf;
lbajardsilogic@0 183
lbajardsilogic@0 184 QMutex *m_mutex;
lbajardsilogic@0 185 };
lbajardsilogic@0 186
lbajardsilogic@0 187 #endif