lbajardsilogic@0
|
1 /* -*- c-basic-offset: 4 indent-tabs-mode: nil -*- vi:set ts=8 sts=4 sw=4: */
|
lbajardsilogic@0
|
2
|
lbajardsilogic@0
|
3 /*
|
lbajardsilogic@0
|
4 Sonic Visualiser
|
lbajardsilogic@0
|
5 An audio file viewer and annotation editor.
|
lbajardsilogic@0
|
6 Centre for Digital Music, Queen Mary, University of London.
|
lbajardsilogic@0
|
7 This file copyright 2006 Chris Cannam and QMUL.
|
lbajardsilogic@0
|
8
|
lbajardsilogic@0
|
9 This program is free software; you can redistribute it and/or
|
lbajardsilogic@0
|
10 modify it under the terms of the GNU General Public License as
|
lbajardsilogic@0
|
11 published by the Free Software Foundation; either version 2 of the
|
lbajardsilogic@0
|
12 License, or (at your option) any later version. See the file
|
lbajardsilogic@0
|
13 COPYING included with this distribution for more information.
|
lbajardsilogic@0
|
14 */
|
lbajardsilogic@0
|
15
|
lbajardsilogic@0
|
16 #ifndef _PHASE_VOCODER_TIME_STRETCHER_H_
|
lbajardsilogic@0
|
17 #define _PHASE_VOCODER_TIME_STRETCHER_H_
|
lbajardsilogic@0
|
18
|
lbajardsilogic@0
|
19 #include "base/Window.h"
|
lbajardsilogic@0
|
20 #include "base/RingBuffer.h"
|
lbajardsilogic@0
|
21
|
lbajardsilogic@0
|
22 #include "data/fft/FFTapi.h"
|
lbajardsilogic@0
|
23
|
lbajardsilogic@0
|
24 #include <QMutex>
|
lbajardsilogic@0
|
25
|
lbajardsilogic@0
|
26 /**
|
lbajardsilogic@0
|
27 * A time stretcher that alters the performance speed of audio,
|
lbajardsilogic@0
|
28 * preserving pitch.
|
lbajardsilogic@0
|
29 *
|
lbajardsilogic@0
|
30 * This is based on the straightforward phase vocoder with phase
|
lbajardsilogic@0
|
31 * unwrapping (as in e.g. the DAFX book pp275-), with optional
|
lbajardsilogic@0
|
32 * percussive transient detection to avoid smearing percussive notes
|
lbajardsilogic@0
|
33 * and resynchronise phases, and adding a stream API for real-time
|
lbajardsilogic@0
|
34 * use. Principles and methods from Chris Duxbury, AES 2002 and 2004
|
lbajardsilogic@0
|
35 * thesis; Emmanuel Ravelli, DAFX 2005; Dan Barry, ISSC 2005 on
|
lbajardsilogic@0
|
36 * percussion detection; code by Chris Cannam.
|
lbajardsilogic@0
|
37 */
|
lbajardsilogic@0
|
38
|
lbajardsilogic@0
|
39 class PhaseVocoderTimeStretcher
|
lbajardsilogic@0
|
40 {
|
lbajardsilogic@0
|
41 public:
|
lbajardsilogic@0
|
42 PhaseVocoderTimeStretcher(size_t sampleRate,
|
lbajardsilogic@0
|
43 size_t channels,
|
lbajardsilogic@0
|
44 float ratio,
|
lbajardsilogic@0
|
45 bool sharpen,
|
lbajardsilogic@0
|
46 size_t maxOutputBlockSize);
|
lbajardsilogic@0
|
47 virtual ~PhaseVocoderTimeStretcher();
|
lbajardsilogic@0
|
48
|
lbajardsilogic@0
|
49 /**
|
lbajardsilogic@0
|
50 * Return the number of samples that would need to be added via
|
lbajardsilogic@0
|
51 * putInput in order to provoke the time stretcher into doing some
|
lbajardsilogic@0
|
52 * time stretching and making more output samples available.
|
lbajardsilogic@0
|
53 * This will be an estimate, if transient sharpening is on; the
|
lbajardsilogic@0
|
54 * caller may need to do the put/get/test cycle more than once.
|
lbajardsilogic@0
|
55 */
|
lbajardsilogic@0
|
56 size_t getRequiredInputSamples() const;
|
lbajardsilogic@0
|
57
|
lbajardsilogic@0
|
58 /**
|
lbajardsilogic@0
|
59 * Put (and possibly process) a given number of input samples.
|
lbajardsilogic@0
|
60 * Number should usually equal the value returned from
|
lbajardsilogic@0
|
61 * getRequiredInputSamples().
|
lbajardsilogic@0
|
62 */
|
lbajardsilogic@0
|
63 void putInput(float **input, size_t samples);
|
lbajardsilogic@0
|
64
|
lbajardsilogic@0
|
65 /**
|
lbajardsilogic@0
|
66 * Get the number of processed samples ready for reading.
|
lbajardsilogic@0
|
67 */
|
lbajardsilogic@0
|
68 size_t getAvailableOutputSamples() const;
|
lbajardsilogic@0
|
69
|
lbajardsilogic@0
|
70 /**
|
lbajardsilogic@0
|
71 * Get some processed samples.
|
lbajardsilogic@0
|
72 */
|
lbajardsilogic@0
|
73 void getOutput(float **output, size_t samples);
|
lbajardsilogic@0
|
74
|
lbajardsilogic@0
|
75 //!!! and reset?
|
lbajardsilogic@0
|
76
|
lbajardsilogic@0
|
77 /**
|
lbajardsilogic@0
|
78 * Change the time stretch ratio.
|
lbajardsilogic@0
|
79 */
|
lbajardsilogic@0
|
80 void setRatio(float ratio);
|
lbajardsilogic@0
|
81
|
lbajardsilogic@0
|
82 /**
|
lbajardsilogic@0
|
83 * Get the hop size for input.
|
lbajardsilogic@0
|
84 */
|
lbajardsilogic@0
|
85 size_t getInputIncrement() const { return m_n1; }
|
lbajardsilogic@0
|
86
|
lbajardsilogic@0
|
87 /**
|
lbajardsilogic@0
|
88 * Get the hop size for output.
|
lbajardsilogic@0
|
89 */
|
lbajardsilogic@0
|
90 size_t getOutputIncrement() const { return m_n2; }
|
lbajardsilogic@0
|
91
|
lbajardsilogic@0
|
92 /**
|
lbajardsilogic@0
|
93 * Get the window size for FFT processing.
|
lbajardsilogic@0
|
94 */
|
lbajardsilogic@0
|
95 size_t getWindowSize() const { return m_wlen; }
|
lbajardsilogic@0
|
96
|
lbajardsilogic@0
|
97 /**
|
lbajardsilogic@0
|
98 * Get the stretch ratio.
|
lbajardsilogic@0
|
99 */
|
lbajardsilogic@0
|
100 float getRatio() const { return float(m_n2) / float(m_n1); }
|
lbajardsilogic@0
|
101
|
lbajardsilogic@0
|
102 /**
|
lbajardsilogic@0
|
103 * Return whether this time stretcher will attempt to sharpen transients.
|
lbajardsilogic@0
|
104 */
|
lbajardsilogic@0
|
105 bool getSharpening() const { return m_sharpen; }
|
lbajardsilogic@0
|
106
|
lbajardsilogic@0
|
107 /**
|
lbajardsilogic@0
|
108 * Return the number of channels for this time stretcher.
|
lbajardsilogic@0
|
109 */
|
lbajardsilogic@0
|
110 size_t getChannelCount() const { return m_channels; }
|
lbajardsilogic@0
|
111
|
lbajardsilogic@0
|
112 /**
|
lbajardsilogic@0
|
113 * Get the latency added by the time stretcher, in sample frames.
|
lbajardsilogic@0
|
114 * This will be exact if transient sharpening is off, or approximate
|
lbajardsilogic@0
|
115 * if it is on.
|
lbajardsilogic@0
|
116 */
|
lbajardsilogic@0
|
117 size_t getProcessingLatency() const;
|
lbajardsilogic@0
|
118
|
lbajardsilogic@0
|
119 protected:
|
lbajardsilogic@0
|
120 /**
|
lbajardsilogic@0
|
121 * Process a single phase vocoder frame from "in" into
|
lbajardsilogic@0
|
122 * m_freq[channel].
|
lbajardsilogic@0
|
123 */
|
lbajardsilogic@0
|
124 void analyseBlock(size_t channel, float *in); // into m_freq[channel]
|
lbajardsilogic@0
|
125
|
lbajardsilogic@0
|
126 /**
|
lbajardsilogic@0
|
127 * Examine m_freq[0..m_channels-1] and return whether a percussive
|
lbajardsilogic@0
|
128 * transient is found.
|
lbajardsilogic@0
|
129 */
|
lbajardsilogic@0
|
130 bool isTransient();
|
lbajardsilogic@0
|
131
|
lbajardsilogic@0
|
132 /**
|
lbajardsilogic@0
|
133 * Resynthesise from m_freq[channel] adding in to "out",
|
lbajardsilogic@0
|
134 * adjusting phases on the basis of a prior step size of lastStep.
|
lbajardsilogic@0
|
135 * Also add the window shape in to the modulation array (if
|
lbajardsilogic@0
|
136 * present) -- for use in ensuring the output has the correct
|
lbajardsilogic@0
|
137 * magnitude afterwards.
|
lbajardsilogic@0
|
138 */
|
lbajardsilogic@0
|
139 void synthesiseBlock(size_t channel, float *out, float *modulation,
|
lbajardsilogic@0
|
140 size_t lastStep);
|
lbajardsilogic@0
|
141
|
lbajardsilogic@0
|
142 void initialise();
|
lbajardsilogic@0
|
143 void calculateParameters();
|
lbajardsilogic@0
|
144 void cleanup();
|
lbajardsilogic@0
|
145
|
lbajardsilogic@0
|
146 bool shouldSharpen() {
|
lbajardsilogic@0
|
147 return m_sharpen && (m_ratio > 0.25);
|
lbajardsilogic@0
|
148 }
|
lbajardsilogic@0
|
149
|
lbajardsilogic@0
|
150 size_t m_sampleRate;
|
lbajardsilogic@0
|
151 size_t m_channels;
|
lbajardsilogic@0
|
152 size_t m_maxOutputBlockSize;
|
lbajardsilogic@0
|
153 float m_ratio;
|
lbajardsilogic@0
|
154 bool m_sharpen;
|
lbajardsilogic@0
|
155 size_t m_n1;
|
lbajardsilogic@0
|
156 size_t m_n2;
|
lbajardsilogic@0
|
157 size_t m_wlen;
|
lbajardsilogic@0
|
158 Window<float> *m_analysisWindow;
|
lbajardsilogic@0
|
159 Window<float> *m_synthesisWindow;
|
lbajardsilogic@0
|
160
|
lbajardsilogic@0
|
161 int m_totalCount;
|
lbajardsilogic@0
|
162 int m_transientCount;
|
lbajardsilogic@0
|
163 int m_n2sum;
|
lbajardsilogic@0
|
164
|
lbajardsilogic@0
|
165 float **m_prevPhase;
|
lbajardsilogic@0
|
166 float **m_prevAdjustedPhase;
|
lbajardsilogic@0
|
167
|
lbajardsilogic@0
|
168 float *m_prevTransientMag;
|
lbajardsilogic@0
|
169 int m_prevTransientScore;
|
lbajardsilogic@0
|
170 int m_transientThreshold;
|
lbajardsilogic@0
|
171 bool m_prevTransient;
|
lbajardsilogic@0
|
172
|
lbajardsilogic@0
|
173 float *m_tempbuf;
|
lbajardsilogic@0
|
174 float **m_time;
|
lbajardsilogic@0
|
175 fftf_complex **m_freq;
|
lbajardsilogic@0
|
176 fftf_plan *m_plan;
|
lbajardsilogic@0
|
177 fftf_plan *m_iplan;
|
lbajardsilogic@0
|
178
|
lbajardsilogic@0
|
179 RingBuffer<float> **m_inbuf;
|
lbajardsilogic@0
|
180 RingBuffer<float> **m_outbuf;
|
lbajardsilogic@0
|
181 float **m_mashbuf;
|
lbajardsilogic@0
|
182 float *m_modulationbuf;
|
lbajardsilogic@0
|
183
|
lbajardsilogic@0
|
184 QMutex *m_mutex;
|
lbajardsilogic@0
|
185 };
|
lbajardsilogic@0
|
186
|
lbajardsilogic@0
|
187 #endif
|