function [y] = extractInstrumental(x,w,N,melodyFile)
%EXTRACTINSTRUMENTAL Suppress the predominant melody of a sound in the STFT domain.
%   y = extractInstrumental(x,w,N,melodyFile)
%
%   For every analysis frame the median melody pitch is looked up, the FFT
%   bins around that pitch and its harmonics (and their mirrored
%   negative-frequency counterparts) are zeroed, and the modified frames
%   are overlap-added into the output.
%
%   Inputs
%     x          : input sound vector (must have the same orientation as w
%                  so that x(...).*w is valid; presumably a column - TODO confirm)
%     w          : analysis window, odd length
%     N          : FFT size used for analysis (must be at least length(w))
%     melodyFile : file handed to loadMelodyFile. The result is used as a
%                  2-row matrix with one column per 128 input samples and
%                  the pitch in Hz in row 2.
%
%   Output
%     y          : column vector of length(x)+512 samples, scaled so that
%                  max(y) equals max(x) (left unscaled when max(y) is 0).
%
%   e.g. y = extractInstrumental(x,hamming(2025),4096,'baby.txt');

% Tunable constants (previously inlined literals)
melodyHop    = 128;      % input samples per melody column
minPitch     = 150;      % pitches at or below this (Hz) are ignored
binHz        = 10.6568;  % NOTE(review): presumably Hz per FFT bin for the
                         % intended sample rate / N - TODO confirm the value
numHarmonics = 40;       % number of harmonics removed per frame
halfWidth    = 6;        % bins removed on each side of every harmonic

% Initialize
M = length(w);                      % analysis window size
if mod(M,2) ~= 1
    % hM below must be an integer, otherwise the frame indexing is invalid
    error('extractInstrumental:evenWindow', ...
          'Analysis window length must be odd (got %d).', M);
end
Ns = 1024;                          % FFT size for synthesis
H = 256;                            % hop size for analysis and synthesis
soundlength = length(x);            % length of input sound array
hNs = Ns/2;                         % half synthesis window size
hM = (M-1)/2;                       % half analysis window size
pin = max(hNs+1,1+hM);              % sound pointer: middle of first analysis window
pend = soundlength-max(hM,hNs);     % last sample to start a frame
fftbuffer = zeros(N,1);             % buffer for FFT
y = zeros(soundlength+Ns/2,1);      % output sound
w = w/sum(w);                       % normalize analysis window

% Synthesis weighting: triangular overlap window divided by a normalized
% Blackman-Harris window, non-zero only on the central 2*H-1 samples.
sw = zeros(Ns,1);
ow = triang(2*H-1);                 % overlapping window
ovidx = Ns/2+1-H+1:Ns/2+H;          % overlap indexes
sw(ovidx) = ow(1:2*H-1);
bh = blackmanharris(Ns);            % synthesis window
bh = bh ./ sum(bh);                 % normalize synthesis window
sw(ovidx) = sw(ovidx) ./ bh(ovidx);

% Load melody file
melody = loadMelodyFile(melodyFile);
% Zero-pad the melody so every frame lookup stays in range. Zero pitch
% means "no melody". Keep at least the historical 1000 columns of padding.
lastColNeeded = round((pend+hM)/melodyHop);
padCols = max(1000, lastColNeeded - size(melody,2));
melody = [melody zeros(2,padCols)];

% For each segment
while pin<pend

    % Find predominant pitch for segment
    segFirst = ceil((pin-hM)/melodyHop);
    segLast  = round((pin+hM)/melodyHop);
    segPitch = melody(2,segFirst:segLast);
    voiced   = segPitch(segPitch>minPitch);   % pitches larger than minPitch

    % Compute FFT for segment
    xw = x(pin-hM:pin+hM).*w(1:M);            % window the input sound
    fftbuffer(1:(M+1)/2) = xw((M+1)/2:M);     % zero-phase window in fftbuffer
    fftbuffer(N-(M-1)/2+1:N) = xw(1:(M-1)/2);
    X = fft(fftbuffer);                       % compute the FFT

    % Remove the melody from the segment
    if ~isempty(voiced)                       % if there is melody, remove the melodic bins
        medpitch  = median(voiced);           % median pitch in segment
        harmonics = (medpitch/binHz) * (1:numHarmonics);
        % positive-frequency bins and their mirrored counterparts
        centers = round([harmonics, N + 2 - harmonics]);
        % widen every centre bin by +/- halfWidth bins
        melodyBins = bsxfun(@plus, centers(:), -halfWidth:halfWidth);
        % Keep only valid indices. Without the upper bound, assigning to
        % bins > N would silently grow X and corrupt the inverse FFT.
        melodyBins = melodyBins(melodyBins>=1 & melodyBins<=N);
        X(melodyBins) = 0;
    end

    ri = pin-hNs;                             % output pointer for overlap-add
    % real(): the zeroed bin set is not guaranteed to be exactly
    % conjugate-symmetric, so discard any residual imaginary part.
    yw = real(ifft(X));
    y(ri:ri+Ns-1) = y(ri:ri+Ns-1)+yw(1:Ns).*sw;
    pin = pin+H;

end

% Scale y to original amplitude; skip when y is silent to avoid NaN/Inf.
peak = max(y);
if peak ~= 0
    y = (max(x)/peak)*y;
end

%wavwrite(y,44100,'test.wav');