annotate extractMelody.m @ 13:844d341cf643 tip

Back up before ISMIR
author Yading Song <yading.song@eecs.qmul.ac.uk>
date Thu, 31 Oct 2013 13:17:06 +0000
parents 6840f77b83aa
children
rev   line source
function [y] = extractMelody(x,w,N,melodyFile)
%EXTRACTMELODY Resynthesise only the spectral bins around the melody pitch.
%   y = extractMelody(x,w,N,melodyFile) analyses x frame by frame (hop of
%   256 samples) with the analysis window w and an N-point FFT. For every
%   frame, only the FFT bins within +/-6 bins of the first 40 multiples of
%   the frame's median melody pitch (and their mirrored bins) are kept; all
%   other bins are zeroed. The inverse transforms are overlap-added into y.
%   Frames without any melody pitch above 150 contribute silence.
%
%   Inputs
%     x          - input sound (vector; coerced to a column)
%     w          - analysis window of odd length (coerced to a column)
%     N          - analysis FFT size; must be >= length(w) and >= 1024
%     melodyFile - file name passed to loadMelodyFile. The returned matrix
%                  is used as 2 rows x frames, the second row holding the
%                  pitch and one column per 128 input samples.
%                  NOTE(review): layout inferred from how the matrix is
%                  indexed here - confirm against loadMelodyFile.
%
%   Output
%     y - column vector of length(x)+512 samples, scaled so that max(y)
%         equals max(x). If nothing was synthesised y is all zeros.
%
%   e.g. y = extractMelody(x,hamming(2025),4096,'baby.txt');

% Fixed settings
Ns         = 1024;      % FFT size for synthesis
H          = 256;       % hop size for analysis and synthesis
melodyHop  = 128;       % input samples per melody column
minPitch   = 150;       % pitches at or below this value are ignored
binWidth   = 10.6568;   % pitch-to-bin divisor. NOTE(review): hard-coded and
                        % independent of N - presumably Hz per FFT bin for
                        % the intended sample rate/FFT size; confirm.
nHarmonics = 40;        % number of pitch multiples kept
binSpread  = 6;         % bins kept on each side of every multiple

% Work on column vectors so the element-wise products below are well defined
x = x(:);
w = w(:);

% Validate the analysis parameters up front instead of failing (or silently
% overwriting parts of the FFT buffer) deep inside the frame loop
M = length(w);                               % analysis window size
if mod(M,2) ~= 1
    error('extractMelody:evenWindow', ...
        'The analysis window must have an odd number of samples (got %d).', M);
end
if N < max(M,Ns)
    error('extractMelody:fftTooSmall', ...
        'N must be at least max(length(w),%d) (got %d).', Ns, N);
end

% Initialize
soundlength = length(x);                     % length of input sound array
hNs  = Ns/2;                                 % half synthesis window size
hM   = (M-1)/2;                              % half analysis window size
pin  = max(hNs+1,1+hM);                      % centre of the first frame
pend = soundlength-max(hM,hNs);              % frame centres must stay below this
fftbuffer = zeros(N,1);                      % buffer for the analysis FFT
y = zeros(soundlength+Ns/2,1);               % output signal
w = w/sum(w);                                % normalize analysis window

% Synthesis weighting: triangular overlap window divided by a normalized
% Blackman-Harris window, non-zero only on the central 2*H-1 samples
sw = zeros(Ns,1);
ow = triang(2*H-1);                          % overlapping window
ovidx = Ns/2+1-H+1:Ns/2+H;                   % overlap indexes
sw(ovidx) = ow(1:2*H-1);
bh = blackmanharris(Ns);                     % synthesis window
bh = bh ./ sum(bh);                          % normalize synthesis window
sw(ovidx) = sw(ovidx) ./ bh(ovidx);

% Load melody file and zero-pad it. At least 1000 extra columns are added
% (as before); more are added when the melody track is shorter than the
% audio, so that the per-frame lookup below can never run past the end.
% Padded columns carry pitch 0 and are therefore treated as "no melody".
melody = loadMelodyFile(melodyFile);
lastColumn = round(soundlength/melodyHop)+1; % upper bound of columns accessed
padColumns = max(1000, lastColumn-size(melody,2));
melody = [melody zeros(2,padColumns)];

% Loop invariants for the bin mask
harmonics  = 1:nHarmonics;
binOffsets = -binSpread:binSpread;

% For each segment
while pin<pend

    % Find predominant pitch for segment
    firstCol = ceil((pin-hM)/melodyHop);
    lastCol  = round((pin+hM)/melodyHop);
    segPitch = melody(2,firstCol:lastCol);
    voiced   = segPitch(segPitch>minPitch);  % pitches above the threshold

    % No melody in this segment: it would only add zeros to y, so skip the
    % FFT/IFFT round trip entirely
    if isempty(voiced)
        pin = pin+H;
        continue;
    end
    medpitch = median(voiced);               % median pitch in segment

    % Compute FFT for segment
    xw = x(pin-hM:pin+hM).*w;                % window the input sound
    fftbuffer(1:(M+1)/2) = xw((M+1)/2:M);    % zero-phase window in fftbuffer
    fftbuffer(N-(M-1)/2+1:N) = xw(1:(M-1)/2);
    X = fft(fftbuffer);                      % compute the FFT

    % Keep only the bins around the pitch multiples and their mirrored bins
    centres = round([(medpitch/binWidth)*harmonics, ...
                     N+2-(medpitch/binWidth)*harmonics]);
    keepBins = bsxfun(@plus,centres(:),binOffsets);
    keepBins = keepBins(keepBins>=1 & keepBins<=N);  % drop out-of-range bins
    keepMask = false(N,1);
    keepMask(keepBins) = true;
    X(~keepMask) = 0;

    % Back to the time domain. real() guards against a complex result when a
    % rounding tie makes the mask not exactly mirror-symmetric; it is a
    % no-op whenever ifft already returns a real vector.
    yw = real(ifft(X));

    % Overlap-add the first Ns samples of the frame into the output
    ri = pin-hNs;                            % first output sample of this frame
    y(ri:ri+Ns-1) = y(ri:ri+Ns-1)+yw(1:Ns).*sw;
    pin = pin+H;

end

% Scale y to original amplitude. Skip the scaling when nothing was
% synthesised: dividing by max(y)==0 would turn the whole output into NaN.
peakOut = max(y);
if peakOut ~= 0
    y = (max(x)/peakOut)*y;
end

%wavwrite(y,44100,'test.wav');